火车采集器软件交流官方论坛

 找回密码
 加入会员
搜索
火车采集器V9版免费下载火车浏览器 - 可视采集,万能群发,全自动脚本工具
楼主: 272070210

火车头免费版伪原创插件+娱乐新闻伪原创采集规则1条

[复制链接]
发表于 2011-5-26 12:20:50 | 显示全部楼层
看看是什么好东西
发表于 2011-5-26 12:22:04 | 显示全部楼层
看看看看看看看看看看看看看看看看
发表于 2011-5-26 13:47:19 | 显示全部楼层
抱着试试看的态度
发表于 2011-5-26 14:13:06 | 显示全部楼层
我也要看啊
发表于 2011-5-26 14:15:34 | 显示全部楼层
<?xml version="1.0" encoding="utf-8"?>
<!--Created by LocoySpider.exe! 2011-05-05 10:04:46-->
<config>
  <!-- Task-level settings for one collection job, as written by the generating tool.
       What this block shows:
       * starturl is a list page on ent.163.com, with sourceencode declared as GB2312.
       * scriptlink holds an escaped HTML fragment with a [参数] placeholder in the href;
         it appears to be the pattern that picks article links out of the list page.
       * truelink rewrites each extracted link to www.zp189.com/locoyseo.php?seo=[link],
         and testpageurl shows the same URL shape with an ent.163.com article as the
         seo value, so article pages are requested through that external script.
       NOTE(review): the external host receives every article URL and can alter the
       returned content; confirm it is trusted and still reachable before use.
       NOTE(review): scriptlink uses [参数] while truelink uses [参数1]; presumably both
       refer to the same captured value; verify against the tool's documentation.
       Elements written as open tag / newline / close tag contain whitespace-only text.
       They are kept byte-identical because the consuming tool may read that text. -->
  <任务>
    <ruleversion>2010</ruleversion>
    <spiderurl>True</spiderurl>
    <spidercontent>True</spidercontent>
    <outcontent>False</outcontent>
    <spiderstep>1</spiderstep>
    <sourceencode>GB2312</sourceencode>
    <starturl>http://ent.163.com/special/00031HA3/dalunews.html</starturl>
    <usespeciallink>True</usespeciallink>
    <usedisablesystemlink>True</usedisablesystemlink>
    <scriptlink>&lt;li&gt;&lt;h5&gt;&lt;a href="[参数]"&gt;</scriptlink>
    <truelink>http://www.zp189.com/locoyseo.php?seo=[参数1]</truelink>
    <listpagemust>
    </listpagemust>
    <listpageforbid>
    </listpageforbid>
    <httpmethod>GET</httpmethod>
    <httppostdata>
    </httppostdata>
    <contentpagemust>html</contentpagemust>
    <contentpageforbid>#</contentpageforbid>
    <listurlstart>
    </listurlstart>
    <listurlend>
    </listurlend>
    <contenturlstart>
    </contenturlstart>
    <contenturlend>
    </contenturlend>
    <dividepagestyle>0</dividepagestyle>
    <dividepagestart>
    </dividepagestart>
    <dividepageend>
    </dividepageend>
    <usemanualstyle>False</usemanualstyle>
    <manualpagestyle>
    </manualpagestyle>
    <manualpageurl>
    </manualpageurl>
    <dividejoincode>
    </dividejoincode>
    <matchdeal>1</matchdeal>
    <testpageurl>http://www.zp189.com/locoyseo.php?seo=http://ent.163.com/11/0504/06/736J5HAI00031H2L.html</testpageurl>
    <useurlencode>True</useurlencode>
    <usebacksort>True</usebacksort>
    <usefirstthumb>False</usefirstthumb>
    <bannedthumb>
    </bannedthumb>
    <maxoutpernum>0</maxoutpernum>
    <updatetype>1</updatetype>
    <update1num>0</update1num>
    <update2week>1</update2week>
    <update3time>
    </update3time>
    <update4interval>10</update4interval>
    <update4start>
    </update4start>
    <update4end>
    </update4end>
    <starttime>
    </starttime>
    <databasesetting>-1</databasesetting>
    <databasesqlsetting>-1</databasesqlsetting>
    <spiderthreadnum>1</spiderthreadnum>
    <outthreadnum>3</outthreadnum>
    <spiderinterval>5000</spiderinterval>
    <outinterval>400</outinterval>
    <successoutsign>0</successoutsign>
    <jobvar1>
    </jobvar1>
    <jobvar2>
    </jobvar2>
    <bak1>备注:发布模块采集规则插件定制QQ:272070210</bak1>
    <postpagestart>1</postpagestart>
    <postpageend>3</postpageend>
    <useautoidentify>False</useautoidentify>
    <usemanualencode>False</usemanualencode>
    <usemanualcookie>False</usemanualcookie>
    <checkrepeat>True</checkrepeat>
    <useradomsort>False</useradomsort>
    <useasyncdownload>True</useasyncdownload>
    <outinterval2>500</outinterval2>
    <posthash>
    </posthash>
    <pluginslist>不使用插件</pluginslist>
    <plugincontent>不使用插件</plugincontent>
    <pluginspages>不使用插件</pluginspages>
    <pluginssave>不使用插件</pluginssave>
    <filefilter>
    </filefilter>
    <flashdic>
    </flashdic>
    <imagedir>
    </imagedir>
    <otherdir>
    </otherdir>
    <usedownthumb>False</usedownthumb>
  </任务>
  <!-- Label definitions: one numbered child element per extracted field, with all
       settings carried as attributes. Both labels have useregex="False" and use
       startstr / endstr delimiters:
       * 标签0, labelname 标题 (title): startstr is the escaped opening title tag and
         endstr is "_". labelnotrepeat is True and labelorder is 0.
       * 标签1, labelname 内容 (content): startstr is the escaped opening div with
         id endText and endstr is the start of an anchor linking to ent.163.com.
         labelnotrepeat is False and labelorder is 1.
       regextrim in 标签0 contains the character ○ between entries; it appears to act
       as a list separator (TODO confirm). The numbered element names and the attribute
       layout are the generating tool's format and are left byte-identical. -->
  <标签>
    <标签0 labelname="标题" useregex="False" regexexp="" startstr="&lt;title&gt;" endstr="_" belongpage="默认页" regextrim="&amp;(*);○(组图)○(图)○ 图" regexreplace="" htmltrim="0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23" downimg="False" downswf="False" downotherfile="False" onlyfetchvalidurl="False" filenamemust="" spiderdatastyle="0" manuladatastyle="0" manualstring="" manualtime="0" manualtimestr="yyyy年MM月dd日 hh时mm分ss秒" radomstringlib="0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz" radomstringlength="8" radomnumstart="1" radomnumend="1000" splitlabel="标题" splitsep="," splitnum="5" summarynum="1000" summarylabel="内容" bak1="" pinyinlabel="标题" pinyinsep="-" useautotranslate="False" labelincicle="False" regexcombine="" incrementstart="1" incrementradomnumstart="1" incrementradomnumend="1" usegbktobig5="False" usebig5togbk="False" labelcontentmust="" labelcontentforbid="" fillrelativeurl="False" htmlexclude="True" usemarstext="False" labelnotnull="True" labelinpage="False" savefileformat="yyyyMMddHHmmss[自增ID]" labelnotrepeat="True" labelorder="0" listlabel="False" />
    <标签1 labelname="内容" useregex="False" regexexp="" startstr="&lt;div id=&quot;endText&quot;&gt;" endstr="&lt;a href=&quot;http://ent.163.com/&quot;" belongpage="默认页" regextrim="&lt;!--(*)--&gt;" regexreplace="" htmltrim="0,1,2,3,6,7,8,10,14,15,16,17,18,19,20,21,22" downimg="False" downswf="False" downotherfile="False" onlyfetchvalidurl="False" filenamemust="" spiderdatastyle="0" manuladatastyle="0" manualstring="" manualtime="0" manualtimestr="yyyy年MM月dd日 hh时mm分ss秒" radomstringlib="0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz" radomstringlength="8" radomnumstart="1" radomnumend="1000" splitlabel="标题" splitsep="," splitnum="5" summarynum="1000" summarylabel="内容" bak1="" pinyinlabel="标题" pinyinsep="-" useautotranslate="False" labelincicle="False" regexcombine="" incrementstart="1" incrementradomnumstart="1" incrementradomnumend="1" usegbktobig5="False" usebig5togbk="False" labelcontentmust="" labelcontentforbid="" fillrelativeurl="False" htmlexclude="True" usemarstext="False" labelnotnull="True" labelinpage="False" savefileformat="yyyyMMddHHmmss[自增ID]" labelnotrepeat="False" labelorder="1" listlabel="False" />
  </标签>
</config>
发表于 2011-5-26 21:29:59 | 显示全部楼层
好东东啊,谢谢!
发表于 2011-5-27 03:30:48 | 显示全部楼层
发表于 2011-5-27 11:04:39 | 显示全部楼层
我也看一下呀,谢谢你的共享精神
发表于 2011-5-28 17:53:27 | 显示全部楼层
发表于 2011-5-28 20:23:19 | 显示全部楼层
回复看看~~~~~~~~~~
您需要登录后才可以回帖 登录 | 加入会员

本版积分规则

QQ|手机版|Archiver|火车采集器官方站 ( 皖ICP备06000549 )

GMT+8, 2025-9-6 15:49

Powered by Discuz! X3.4

Copyright © 2001-2020, Tencent Cloud.

快速回复 返回顶部 返回列表