亚洲欧美第一页_禁久久精品乱码_粉嫩av一区二区三区免费野_久草精品视频

? 歡迎來到蟲蟲下載站! | ?? 資源下載 ?? 資源專輯 ?? 關於我們
? 蟲蟲下載站

?? experimentalwarcwriter.java

?? 爬蟲
?? JAVA
?? 第 1 頁 / 共 2 頁
字號:
/*  $Id: ExperimentalWARCWriter.java,v 1.21 2006/09/06 05:38:18 stack-sf Exp $ * * Created on July 27th, 2006 * * Copyright (C) 2006 Internet Archive. * * This file is part of the Heritrix web crawler (crawler.archive.org). * * Heritrix is free software; you can redistribute it and/or modify * it under the terms of the GNU Lesser Public License as published by * the Free Software Foundation; either version 2.1 of the License, or * any later version. * * Heritrix is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the * GNU Lesser Public License for more details. * * You should have received a copy of the GNU Lesser Public License * along with Heritrix; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA */package org.archive.io.warc;import java.io.ByteArrayInputStream;import java.io.ByteArrayOutputStream;import java.io.File;import java.io.IOException;import java.io.InputStream;import java.io.OutputStream;import java.net.URI;import java.net.URISyntaxException;import java.text.DecimalFormat;import java.text.NumberFormat;import java.util.Iterator;import java.util.List;import java.util.Map;import java.util.concurrent.atomic.AtomicInteger;import org.archive.io.UTF8Bytes;import org.archive.io.WriterPoolMember;import org.archive.uid.GeneratorFactory;import org.archive.util.ArchiveUtils;import org.archive.util.anvl.ANVLRecord;/** * <b>Experimental</b> WARC implementation. *  * Based on unreleased version 0.9 of <a  * href="http://archive-access.sourceforge.net//warc/warc_file_format.html">WARC * File Format</a> document.  Specification and implementation subject to * change. * * <p>Assumption is that the caller is managing access to this * ExperimentalWARCWriter ensuring only one thread accessing this WARC instance * at any one time. 
*  * <p>While being written, WARCs have a '.open' suffix appended. * * @author stack * @version $Revision: 1.21 $ $Date: 2006/09/06 05:38:18 $ */public class ExperimentalWARCWriter extends WriterPoolMemberimplements WARCConstants {    /**     * Buffer to reuse writing streams.     */    private final byte [] readbuffer = new byte[16 * 1024];        /**     * NEWLINE as bytes.     */    public static byte [] CRLF_BYTES;    static {        try {            CRLF_BYTES = CRLF.getBytes(DEFAULT_ENCODING);        } catch(Exception e) {            e.printStackTrace();        }    };        /**     * Formatter for the length.     */    private static NumberFormat RECORD_LENGTH_FORMATTER =        new DecimalFormat(PLACEHOLDER_RECORD_LENGTH_STRING);        /**     * Metadata.     * TODO: Exploit writing warcinfo record.  Currently unused.     */    private final List fileMetadata;            /**     * Shutdown Constructor     * Has default access so can make instance to test utility methods.     */    ExperimentalWARCWriter() {        this(null, null, "", "", true, -1, null);    }        /**     * Constructor.     * Takes a stream. Use with caution. There is no upperbound check on size.     * Will just keep writing.  Only pass Streams that are bounded.      * @param serialNo  used to generate unique file name sequences     * @param out Where to write.     * @param f File the <code>out</code> is connected to.     * @param cmprs Compress the content written.     * @param a14DigitDate If null, we'll write current time.     * @throws IOException     */    public ExperimentalWARCWriter(final AtomicInteger serialNo,    		final OutputStream out, final File f,    		final boolean cmprs, final String a14DigitDate,            final List warcinfoData)    throws IOException {        super(serialNo, out, f, cmprs, a14DigitDate);        // TODO: Currently unused.        this.fileMetadata = warcinfoData;    }                /**     * Constructor.     *     * @param dirs Where to drop files.  
   * @param prefix File prefix to use.     * @param cmprs Compress the records written.      * @param maxSize Maximum size for ARC files written.     * @param suffix File tail to use.  If null, unused.     * @param warcinfoData File metadata for warcinfo record.     */    public ExperimentalWARCWriter(final AtomicInteger serialNo,    		final List<File> dirs, final String prefix,             final String suffix, final boolean cmprs,            final int maxSize, final List warcinfoData) {        super(serialNo, dirs, prefix, suffix, cmprs, maxSize,        	WARC_FILE_EXTENSION);        // TODO: Currently unused.        this.fileMetadata = warcinfoData;    }        @Override    protected String createFile(File file) throws IOException {    	String filename = super.createFile(file);    	writeWarcinfoRecord(filename);        return filename;    }        protected void baseCharacterCheck(final char c, final String parameter)    throws IOException {        // TODO: Too strict?  UNICODE control characters?        
if (Character.isISOControl(c) || !Character.isValidCodePoint(c)) {            throw new IOException("Contains illegal character 0x" +                Integer.toHexString(c) + ": " + parameter);        }    }        protected String checkHeaderLineParameters(final String parameter)    throws IOException {        for (int i = 0; i < parameter.length(); i++) {        	final char c = parameter.charAt(i);        	baseCharacterCheck(c, parameter);        	if (Character.isWhitespace(c)) {                throw new IOException("Contains disallowed white space 0x" +                    Integer.toHexString(c) + ": " + parameter);        	}        }        return parameter;    }        protected String checkHeaderLineMimetypeParameter(final String parameter)    throws IOException {    	StringBuilder sb = new StringBuilder(parameter.length());    	boolean wasWhitespace = false;        for (int i = 0; i < parameter.length(); i++) {        	char c = parameter.charAt(i);        	if (Character.isWhitespace(c)) {        		// Map all to ' ' and collapse multiples into one.        		// TODO: Make sure white space occurs in legal location --        		// before parameter or inside quoted-string.        		
if (wasWhitespace) {        			continue;        		}        		wasWhitespace = true;        		c = ' ';        	} else {        		wasWhitespace = false;        		baseCharacterCheck(c, parameter);        	}        	sb.append(c);        }                return sb.toString();    }    protected byte [] createRecordHeaderline(final String type,    		final String url, final String create14DigitDate,    		final String mimetype, final URI recordId,    		final int namedFieldsLength, final long contentLength)    throws IOException {    	final StringBuilder sb =    		new StringBuilder(2048/*A SWAG: TODO: Do analysis.*/);    	sb.append(WARC_ID);    	sb.append(HEADER_FIELD_SEPARATOR);    	sb.append(PLACEHOLDER_RECORD_LENGTH_STRING);    	sb.append(HEADER_FIELD_SEPARATOR);    	sb.append(type);    	sb.append(HEADER_FIELD_SEPARATOR);    	sb.append(checkHeaderLineParameters(url));    	sb.append(HEADER_FIELD_SEPARATOR);    	sb.append(checkHeaderLineParameters(create14DigitDate));    	sb.append(HEADER_FIELD_SEPARATOR);    	// 0.9 of spec. has mimetype second-to-last and recordid last on    	// header line.  Here we swap their positions and allow writing    	// of full mimetypes rather than the curtailed type we used write into    	// ARCs.  These two deviations to be proposed as amendments to spec 0.9.    	sb.append(checkHeaderLineParameters(recordId.toString()));    	sb.append(HEADER_FIELD_SEPARATOR);    	sb.append(checkHeaderLineMimetypeParameter(mimetype));        // Add terminating CRLF.        sb.append(CRLF);    	    	long length = sb.length() + namedFieldsLength + contentLength;    	

?? 快捷鍵說明

複製代碼 Ctrl + C
搜索代碼 Ctrl + F
全屏模式 F11
切換主題 Ctrl + Shift + D
顯示快捷鍵 ?
增大字號 Ctrl + =
減小字號 Ctrl + -
亚洲欧美第一页_禁久久精品乱码_粉嫩av一区二区三区免费野_久草精品视频
国产999精品久久| 麻豆91精品视频| 欧美激情一区在线观看| 欧美mv和日韩mv的网站| 日韩精品一区在线| 日韩精品中文字幕一区| 日韩精品一区二区在线| 日韩美女天天操| 久久久久九九视频| 国产日韩欧美a| 国产精品久久久久影院色老大| 久久精品视频一区二区三区| 国产欧美一区二区精品仙草咪 | 国产河南妇女毛片精品久久久| 蜜桃91丨九色丨蝌蚪91桃色| 久久99久国产精品黄毛片色诱| 蜜桃一区二区三区在线| 国产一区二区三区视频在线播放| 国产成人午夜视频| 成人av在线资源网| 在线观看亚洲一区| 欧美一区二区三区免费大片| 欧美精品一区二区三区很污很色的 | 久久国产精品99久久人人澡| 狠狠色丁香婷婷综合久久片| 成人国产电影网| 在线观看视频一区二区 | 精品一区免费av| 国产美女精品在线| 91在线观看免费视频| 欧美日韩一卡二卡三卡 | 欧美激情一区二区三区四区| 最新日韩在线视频| 日韩高清不卡一区二区| 国产精品18久久久久久久久久久久 | 粗大黑人巨茎大战欧美成人| 91麻豆成人久久精品二区三区| 91麻豆精品久久久久蜜臀| 26uuu国产日韩综合| 亚洲日本成人在线观看| 日韩中文字幕区一区有砖一区| 国产精品77777| 欧美一区二区三区视频在线观看| 国产蜜臀av在线一区二区三区| 亚洲成人动漫av| 成人黄色软件下载| 欧美成人午夜电影| 亚洲综合在线观看视频| 国产一区二三区好的| 欧美日韩一区二区在线观看视频 | 成人小视频在线观看| 欧美日韩不卡在线| 五月综合激情网| 国产成人亚洲综合a∨婷婷| 欧美日韩国产高清一区二区| 亚洲欧洲成人精品av97| 久久国产精品一区二区| 在线不卡免费av| 亚洲综合免费观看高清在线观看 | 1区2区3区国产精品| 捆绑调教一区二区三区| 欧美日韩一区二区在线观看视频 | 欧美色国产精品| 亚洲色图清纯唯美| 成人性生交大片免费看视频在线 | 成人一区二区三区在线观看 | 黄页网站大全一区二区| 在线成人午夜影院| 亚洲成人自拍偷拍| 91成人国产精品| 一区二区三区不卡视频在线观看| 粉嫩绯色av一区二区在线观看| 精品乱码亚洲一区二区不卡| 日韩高清在线观看| 91精品在线麻豆| 奇米精品一区二区三区在线观看一| 欧美中文字幕亚洲一区二区va在线 | 日韩精品自拍偷拍| 久久精品国产一区二区三| 欧美人牲a欧美精品| 午夜精品一区二区三区免费视频 | 99久久国产综合精品麻豆| 中文字幕第一区综合| 成人蜜臀av电影| 亚洲日本在线观看| 色女孩综合影院| 亚洲第一搞黄网站| 欧美一区二区三区在线看| 久久精品99国产国产精| 久久人人97超碰com| 成人网页在线观看| 亚洲乱码一区二区三区在线观看| 色婷婷激情一区二区三区| 一区二区三区四区高清精品免费观看| 欧美在线影院一区二区| 五月婷婷欧美视频| 久久久久青草大香线综合精品| 国产成人99久久亚洲综合精品| 亚洲欧美一区二区视频| 欧美在线观看一区| 久久精品国产精品亚洲精品| 国产欧美精品一区二区色综合朱莉| 成人午夜免费视频| 午夜影视日本亚洲欧洲精品| 日韩午夜在线影院| 成人精品国产福利| 亚洲一区在线观看免费观看电影高清| 日韩一区二区麻豆国产| 国产成人一级电影| 亚洲超碰精品一区二区| 精品国产精品网麻豆系列| 不卡的电影网站| 偷拍一区二区三区| 亚洲国产精品高清| 正在播放亚洲一区| 成人动漫在线一区| 久久电影网站中文字幕| 亚洲日本va在线观看| 日韩免费在线观看| www成人在线观看| www.66久久| 麻豆精品视频在线| 亚洲一区二区免费视频| 久久久久免费观看| 欧美一区二区播放| 色猫猫国产区一区二在线视频| 久久国产精品露脸对白| 亚洲国产精品麻豆| 国产精品久久久爽爽爽麻豆色哟哟 | 成人性生交大片| 另类综合日韩欧美亚洲| 亚洲国产欧美另类丝袜| 国产香蕉久久精品综合网| 欧美电影一区二区| 欧美视频一区二区在线观看| 岛国一区二区在线观看| 久久精品国产亚洲aⅴ| 日韩中文字幕亚洲一区二区va在线| 国产精品久久久久久久久搜平片 | 91在线观看一区二区| 精品一区二区成人精品| 日日摸夜夜添夜夜添精品视频| 悠悠色在线精品| 亚洲人成在线观看一区二区| 日本一区二区免费在线 | kk眼镜猥琐国模调教系列一区二区| 美腿丝袜亚洲色图| 日韩一区欧美二区| 午夜激情久久久| 婷婷综合五月天| 亚洲午夜久久久久| 亚洲国产精品久久人人爱蜜臀| 亚洲国产精品久久人人爱| 亚洲一区二区三区四区五区黄| 亚洲色图在线视频| 夜夜嗨av一区二区三区四季av| 亚洲人成精品久久久久久| 亚洲色图第一区| 亚洲另类春色国产| 亚洲永久免费视频| 
视频一区视频二区中文字幕| 婷婷六月综合网| 蜜桃久久久久久久| 极品瑜伽女神91| 成人福利视频在线| 91成人看片片| 日韩一区二区中文字幕| 日韩欧美成人激情| 国产精品污www在线观看| 国产精品久久久久久久浪潮网站| 亚洲丝袜另类动漫二区| 亚洲一区二区三区激情| 亚洲电影你懂得| 韩日av一区二区| av不卡在线播放| 欧美伦理电影网| 久久你懂得1024| 一区二区欧美精品| 精品亚洲国产成人av制服丝袜| 国产风韵犹存在线视精品| 91蝌蚪porny| 欧美一区二区三区免费观看视频| 精品国产一区二区在线观看| 国产欧美一区二区精品性色超碰| 亚洲视频综合在线| 免费成人美女在线观看.| 国产成人av电影| 欧美日韩激情在线| 国产人久久人人人人爽| 一区二区三区在线视频观看| 麻豆极品一区二区三区| www.日韩av| 欧美mv和日韩mv国产网站| 一区二区三区在线观看视频| 欧美bbbbb| 欧美视频完全免费看| 久久久久久一二三区| 亚洲国产精品久久久久秋霞影院| 国产精品小仙女| 日韩欧美中文一区|