亚洲欧美第一页_禁久久精品乱码_粉嫩av一区二区三区免费野_久草精品视频

? 歡迎來到蟲蟲下載站! | ?? 資源下載 ?? 資源專輯 ?? 關于我們
? 蟲蟲下載站

?? abstractfrontier.html

?? 網絡爬蟲開源代碼
?? HTML
?? 第 1 頁 / 共 5 頁
字號:
<a name="556" href="#556">556</a>             }<a name="557" href="#557">557</a>         }<a name="558" href="#558">558</a>         <em class="comment">// save ignored items (if any) where they can be consulted later</em><a name="559" href="#559">559</a>         saveIgnoredItems(ignoredWriter.toString(), controller.getDisk());<a name="560" href="#560">560</a>         logger.info(<span class="string">"finished"</span>);<a name="561" href="#561">561</a>     }<a name="562" href="#562">562</a> <a name="563" href="#563">563</a>     <em>/**<em>*</em></em><a name="564" href="#564">564</a> <em>     * Dump ignored seed items (if any) to disk; delete file otherwise.</em><a name="565" href="#565">565</a> <em>     * Static to allow non-derived sibling classes (frontiers not yet </em><a name="566" href="#566">566</a> <em>     * subclassed here) to reuse.</em><a name="567" href="#567">567</a> <em>     * </em><a name="568" href="#568">568</a> <em>     * @param ignoredItems</em><a name="569" href="#569">569</a> <em>     * @param dir </em><a name="570" href="#570">570</a> <em>     */</em><a name="571" href="#571">571</a>     <strong>public</strong> <strong>static</strong> <strong>void</strong> saveIgnoredItems(String ignoredItems, File dir) {<a name="572" href="#572">572</a>         File ignoredFile = <strong>new</strong> File(dir, IGNORED_SEEDS_FILENAME);<a name="573" href="#573">573</a>         <strong>if</strong>(ignoredItems==<strong>null</strong> | ignoredItems.length()>0) {<a name="574" href="#574">574</a>             <strong>try</strong> {<a name="575" href="#575">575</a>                 BufferedWriter bw = <strong>new</strong> BufferedWriter(<strong>new</strong> FileWriter(ignoredFile));<a name="576" href="#576">576</a>                 bw.write(ignoredItems);<a name="577" href="#577">577</a>                 bw.close();<a name="578" href="#578">578</a>             } <strong>catch</strong> (IOException e) {<a name="579" href="#579">579</a>                 <em class="comment">// TODO make an alert?</em><a name="580" href="#580">580</a>                 e.printStackTrace();<a name="581" href="#581">581</a>             }<a name="582" href="#582">582</a>         } <strong>else</strong> {<a name="583" href="#583">583</a>             <em class="comment">// delete any older file (if any)</em><a name="584" href="#584">584</a>             ignoredFile.delete();<a name="585" href="#585">585</a>         }<a name="586" href="#586">586</a>     }<a name="587" href="#587">587</a> <a name="588" href="#588">588</a>     <strong>protected</strong> <a href="../../../../org/archive/crawler/datamodel/CrawlURI.html">CrawlURI</a> asCrawlUri(<a href="../../../../org/archive/crawler/datamodel/CandidateURI.html">CandidateURI</a> caUri) {<a name="589" href="#589">589</a>         <a href="../../../../org/archive/crawler/datamodel/CrawlURI.html">CrawlURI</a> curi;<a name="590" href="#590">590</a>         <strong>if</strong> (caUri instanceof CrawlURI) {<a name="591" href="#591">591</a>             curi = (CrawlURI)caUri;<a name="592" href="#592">592</a>         } <strong>else</strong> {<a name="593" href="#593">593</a>             curi = CrawlURI.from(caUri, nextOrdinal.getAndIncrement());<a name="594" href="#594">594</a>         }<a name="595" href="#595">595</a>         curi.setClassKey(getClassKey(curi));<a name="596" href="#596">596</a>         <strong>return</strong> curi;<a name="597" href="#597">597</a>     }<a name="598" href="#598">598</a> <a name="599" href="#599">599</a>     <em>/**<em>*</em></em><a name="600" href="#600">600</a> <em>     * @param now</em><a name="601" href="#601">601</a> <em>     * @throws InterruptedException</em><a name="602" href="#602">602</a> <em>     * @throws EndedException</em><a name="603" href="#603">603</a> <em>     */</em><a name="604" href="#604">604</a>     <strong>protected</strong> <strong>synchronized</strong> <strong>void</strong> preNext(<strong>long</strong> now) throws InterruptedException,<a name="605" href="#605">605</a>             <a href="../../../../org/archive/crawler/framework/exceptions/EndedException.html">EndedException</a> {<a name="606" href="#606">606</a>         <strong>if</strong> (<strong>this</strong>.controller == <strong>null</strong>) {<a name="607" href="#607">607</a>             <strong>return</strong>;<a name="608" href="#608">608</a>         }<a name="609" href="#609">609</a>         <a name="610" href="#610">610</a>         <em class="comment">// Check completion conditions</em><a name="611" href="#611">611</a>         <strong>if</strong> (<strong>this</strong>.controller.atFinish()) {<a name="612" href="#612">612</a>             <strong>if</strong> (((Boolean)getUncheckedAttribute(<strong>null</strong>, ATTR_PAUSE_AT_FINISH))<a name="613" href="#613">613</a>                     .booleanValue()) {<a name="614" href="#614">614</a>                 <strong>this</strong>.controller.requestCrawlPause();<a name="615" href="#615">615</a>             } <strong>else</strong> {<a name="616" href="#616">616</a>                 <strong>this</strong>.controller.beginCrawlStop();<a name="617" href="#617">617</a>             }<a name="618" href="#618">618</a>         }<a name="619" href="#619">619</a> <a name="620" href="#620">620</a>         <em class="comment">// enforce operator pause</em><a name="621" href="#621">621</a>         <strong>if</strong> (shouldPause) {<a name="622" href="#622">622</a>             <strong>while</strong> (shouldPause) {<a name="623" href="#623">623</a>                 <strong>this</strong>.controller.toePaused();<a name="624" href="#624">624</a>                 wait();<a name="625" href="#625">625</a>             }<a name="626" href="#626">626</a>             <em class="comment">// exitted pause; possibly finish regardless of pause-at-finish</em><a name="627" href="#627">627</a>             <strong>if</strong> (controller != <strong>null</strong> &amp;&amp; controller.atFinish()) {<a name="628" href="#628">628</a>                 <strong>this</strong>.controller.beginCrawlStop();<a name="629" href="#629">629</a>             }<a name="630" href="#630">630</a>         }<a name="631" href="#631">631</a> <a name="632" href="#632">632</a>         <em class="comment">// enforce operator terminate or thread retirement</em><a name="633" href="#633">633</a>         <strong>if</strong> (shouldTerminate<a name="634" href="#634">634</a>                 || ((ToeThread)Thread.currentThread()).shouldRetire()) {<a name="635" href="#635">635</a>             <strong>throw</strong> <strong>new</strong> <a href="../../../../org/archive/crawler/framework/exceptions/EndedException.html">EndedException</a>(<span class="string">"terminated"</span>);<a name="636" href="#636">636</a>         }<a name="637" href="#637">637</a> <a name="638" href="#638">638</a>         enforceBandwidthThrottle(now);<a name="639" href="#639">639</a>     }<a name="640" href="#640">640</a> <a name="641" href="#641">641</a>     <em>/**<em>*</em></em><a name="642" href="#642">642</a> <em>     * Perform any special handling of the CrawlURI, such as promoting its URI</em><a name="643" href="#643">643</a> <em>     * to seed-status, or preferencing it because it is an embed.</em><a name="644" href="#644">644</a> <em>     * </em><a name="645" href="#645">645</a> <em>     * @param curi</em><a name="646" href="#646">646</a> <em>     */</em><a name="647" href="#647">647</a>     <strong>protected</strong> <strong>void</strong> applySpecialHandling(<a href="../../../../org/archive/crawler/datamodel/CrawlURI.html">CrawlURI</a> curi) {<a name="648" href="#648">648</a>         <strong>if</strong> (curi.isSeed() &amp;&amp; curi.getVia() != <strong>null</strong><a name="649" href="#649">649</a>                 &amp;&amp; curi.flattenVia().length() > 0) {<a name="650" href="#650">650</a>             <em class="comment">// The only way a seed can have a non-empty via is if it is the</em><a name="651" href="#651">651</a>             <em class="comment">// result of a seed redirect. Add it to the seeds list.</em><a name="652" href="#652">652</a>             <em class="comment">//</em><a name="653" href="#653">653</a>             <em class="comment">// This is a feature. This is handling for case where a seed</em><a name="654" href="#654">654</a>             <em class="comment">// gets immediately redirected to another page. What we're doing is</em><a name="655" href="#655">655</a>             <em class="comment">// treating the immediate redirect target as a seed.</em><a name="656" href="#656">656</a>             <strong>this</strong>.controller.getScope().addSeed(curi);<a name="657" href="#657">657</a>             <em class="comment">// And it needs rapid scheduling.</em><a name="658" href="#658">658</a> 	    <strong>if</strong> (curi.getSchedulingDirective() == CandidateURI.NORMAL)<a name="659" href="#659">659</a>                 curi.setSchedulingDirective(CandidateURI.MEDIUM);<a name="660" href="#660">660</a>         }<a name="661" href="#661">661</a> <a name="662" href="#662">662</a>         <em class="comment">// optionally preferencing embeds up to MEDIUM</em><a name="663" href="#663">663</a>         <strong>int</strong> prefHops = ((Integer)getUncheckedAttribute(curi,<a name="664" href="#664">664</a>                 ATTR_PREFERENCE_EMBED_HOPS)).intValue();<a name="665" href="#665">665</a>         <strong>if</strong> (prefHops > 0) {<a name="666" href="#666">666</a>             <strong>int</strong> embedHops = curi.getTransHops();<a name="667" href="#667">667</a>             <strong>if</strong> (embedHops > 0 &amp;&amp; embedHops &lt;= prefHops<a name="668" href="#668">668</a>                     &amp;&amp; curi.getSchedulingDirective() == CandidateURI.NORMAL) {<a name="669" href="#669">669</a>                 <em class="comment">// number of embed hops falls within the preferenced range, and</em><a name="670" href="#670">670</a>                 <em class="comment">// uri is not already MEDIUM -- so promote it</em><a name="671" href="#671">671</a>                 curi.setSchedulingDirective(CandidateURI.MEDIUM);<a name="672" href="#672">672</a>             }<a name="673" href="#673">673</a>         }<a name="674" href="#674">674</a>     }<a name="675" href="#675">675</a> <a name="676" href="#676">676</a>     <em>/**<em>*</em></em><a name="677" href="#677">677</a> <em>     * Perform fixups on a CrawlURI about to be returned via next().</em><a name="678" href="#678">678</a> <em>     * </em><a name="679" href="#679">679</a> <em>     * @param curi</em><a name="680" href="#680">680</a> <em>     *            CrawlURI about to be returned by next()</em><a name="681" href="#681">681</a> <em>     * @param q</em><a name="682" href="#682">682</a> <em>     *            the queue from which the CrawlURI came</em><a name="683" href="#683">683</a> <em>     */</em><a name="684" href="#684">684</a>     <strong>protected</strong> <strong>void</strong> noteAboutToEmit(<a href="../../../../org/archive/crawler/datamodel/CrawlURI.html">CrawlURI</a> curi, <a href="../../../../org/archive/crawler/frontier/WorkQueue.html">WorkQueue</a> q) {<a name="685" href="#685">685</a>         curi.setHolder(q);<a name="686" href="#686">686</a>         <em class="comment">// if (curi.getServer() == null) {</em><a name="687" href="#687">687</a>         <em class="comment">//    // TODO: perhaps short-circuit the emit here,</em><a name="688" href="#688">688</a>         <em class="comment">//    // because URI will be rejected as unfetchable</em><a name="689" href="#689">689</a>         <em class="comment">// }</em><a name="690" href="#690">690</a>         doJournalEmitted(curi);<a name="691" href="#691">691</a>     }<a name="692" href="#692">692</a> <a name="693" href="#693">693</a>     <em>/**<em>*</em></em><a name="694" href="#694">694</a> <em>     * @param curi</em><a name="695" href="#695">695</a> <em>     * @return the CrawlServer to be associated with this CrawlURI</em><

?? 快捷鍵說明

復制代碼 Ctrl + C
搜索代碼 Ctrl + F
全屏模式 F11
切換主題 Ctrl + Shift + D
顯示快捷鍵 ?
增大字號 Ctrl + =
減小字號 Ctrl + -
亚洲欧美第一页_禁久久精品乱码_粉嫩av一区二区三区免费野_久草精品视频
国产 欧美在线| 国产一区二区影院| 亚洲日本一区二区| 国产精品理论片| 国产精品国产精品国产专区不片| 国产农村妇女毛片精品久久麻豆 | 26uuu国产电影一区二区| 91精品婷婷国产综合久久竹菊| 欧美三级电影网站| 6080yy午夜一二三区久久| 欧美日韩国产色站一区二区三区| 欧美性xxxxx极品少妇| 欧美日韩一区中文字幕| 欧美片网站yy| 日韩你懂的在线观看| 欧美成人一区二区| 国产午夜一区二区三区| 自拍视频在线观看一区二区| 依依成人精品视频| 视频一区二区中文字幕| 精品伊人久久久久7777人| 国产在线国偷精品免费看| 成人免费毛片嘿嘿连载视频| 97se亚洲国产综合自在线不卡| 色噜噜狠狠成人中文综合| 制服视频三区第一页精品| 精品国产免费久久| 国产精品久久久久久妇女6080 | 精品视频1区2区3区| 欧美一区二区三区免费在线看 | 国产精品一区免费在线观看| 成人高清在线视频| 欧美吻胸吃奶大尺度电影| 欧美一区二区三区在线电影| 中文字幕欧美国产| 亚洲成人av一区二区三区| 久久99热狠狠色一区二区| 成人小视频在线观看| 欧美日韩精品三区| 久久精品人人做人人爽人人| 亚洲综合免费观看高清完整版 | 亚洲免费观看视频| 免费观看日韩av| 91丨九色porny丨蝌蚪| 日韩欧美国产麻豆| 一区二区三区免费在线观看| 激情久久五月天| 精品视频资源站| 中文字幕一区二区三| 美日韩一区二区三区| 色婷婷综合久久| 国产午夜亚洲精品理论片色戒 | 欧美猛男超大videosgay| 中文一区在线播放| 久久精品国内一区二区三区| 在线区一区二视频| 国产精品久久久久影院| 国产一区二区三区四区五区入口 | 亚洲国产精品传媒在线观看| 日韩精品成人一区二区在线| 一本久道中文字幕精品亚洲嫩| 国产婷婷精品av在线| 国产在线视频一区二区| 欧美顶级少妇做爰| 午夜私人影院久久久久| 在线观看91视频| 亚洲已满18点击进入久久| 99精品久久久久久| 国产精品高清亚洲| www.99精品| 自拍偷拍亚洲综合| 日本韩国精品一区二区在线观看| 国产精品理论片在线观看| 波多野结衣在线一区| 国产精品嫩草影院av蜜臀| 国产福利91精品一区二区三区| 精品国产一区二区三区忘忧草| 美女视频黄a大片欧美| 日韩欧美不卡一区| 久久99国产精品成人| 欧美成人猛片aaaaaaa| 狠狠狠色丁香婷婷综合久久五月| 欧美一区二区三区精品| 蜜臀av性久久久久蜜臀aⅴ| 在线综合+亚洲+欧美中文字幕| 三级久久三级久久| 欧美大片免费久久精品三p| 国产乱对白刺激视频不卡| 国产偷v国产偷v亚洲高清| 99r精品视频| 国产精品国产精品国产专区不片 | 欧美色图激情小说| 五月婷婷综合在线| 欧美一级黄色录像| 成人综合在线观看| 亚洲午夜精品在线| 日韩免费观看高清完整版 | 亚洲国产欧美在线| 日韩一区二区三区电影| 久久精品国产999大香线蕉| 久久久精品中文字幕麻豆发布| 国产一区高清在线| 亚洲视频在线观看一区| 91精品国产免费| 国产精选一区二区三区| 亚洲久草在线视频| 日韩欧美一级特黄在线播放| 丁香婷婷综合五月| 亚洲一区二区免费视频| 欧美mv日韩mv国产| 在线精品视频一区二区三四| 激情综合五月婷婷| 亚洲综合自拍偷拍| 日韩欧美在线观看一区二区三区| 九色综合国产一区二区三区| 国产精品久久久久久户外露出 | 久久久www成人免费无遮挡大片 | 亚洲国产美国国产综合一区二区| 欧美一区二区三区的| k8久久久一区二区三区| 日韩精品电影在线观看| 亚洲素人一区二区| 26uuu国产电影一区二区| 欧美性猛交xxxxxx富婆| 成人午夜视频福利| 秋霞午夜鲁丝一区二区老狼| 中文字幕一区在线观看| 欧美不卡视频一区| 欧美日韩一区二区三区免费看| 国产一区二区三区免费看| 亚洲大片一区二区三区| 中文av一区特黄| 久久先锋影音av鲁色资源| 日韩三级精品电影久久久| 色综合久久88色综合天天免费| 国产一区二区三区最好精华液| 视频一区免费在线观看| 亚洲国产精品尤物yw在线观看| 国产精品电影一区二区三区| 久久亚洲欧美国产精品乐播| 日韩午夜小视频| 欧美久久久一区| 欧美视频一区在线观看| 91福利资源站| 色激情天天射综合网| 色噜噜狠狠成人中文综合| 色中色一区二区| 色8久久精品久久久久久蜜| 99热精品一区二区| 99久久综合精品| gogo大胆日本视频一区| 成人黄动漫网站免费app| 国产精品99久久久久久久女警 | 国产精品毛片高清在线完整版| 欧美v日韩v国产v| 精品福利av导航| 国产亚洲视频系列| 中文字幕精品综合| 中文字幕一区二区三区不卡在线| 中文字幕视频一区二区三区久| 国产精品久久久99| 亚洲精品一卡二卡| 亚洲国产成人高清精品| 亚州成人在线电影| 日本伊人午夜精品| 久久国产婷婷国产香蕉| 国产精品影视天天线| 波多野结衣精品在线| 一本大道久久a久久综合婷婷| 色视频成人在线观看免| 欧美一三区三区四区免费在线看| 日韩午夜av一区| 欧美高清在线视频| 伊人色综合久久天天| 亚洲成人免费在线| 国产在线精品国自产拍免费| av激情综合网| 欧美精品aⅴ在线视频| 欧美成人一区二区三区片免费| 国产精品伦理在线| 午夜不卡av免费| 国产精品一色哟哟哟| 日本二三区不卡| 精品国产乱码久久久久久久| 国产精品久久久久影视| 五月综合激情网| 99久久综合色| 日韩免费性生活视频播放| 1区2区3区国产精品| 五月天激情小说综合| 成人黄色一级视频| 91麻豆精品国产91久久久久| 国产人妖乱国产精品人妖| 亚洲妇熟xx妇色黄| 国产传媒久久文化传媒| 欧美精品在线观看一区二区| 国产精品卡一卡二卡三| 国内一区二区视频| 欧美无乱码久久久免费午夜一区| 国产日产欧美一区|