亚洲欧美第一页_禁久久精品乱码_粉嫩av一区二区三区免费野_久草精品视频

? 歡迎來(lái)到蟲(chóng)蟲(chóng)下載站! | ?? 資源下載 ?? 資源專(zhuān)輯 ?? 關(guān)于我們
? 蟲(chóng)蟲(chóng)下載站

?? html.pl

?? namazu. 雖然是日語(yǔ)的,也適用于文件中單詞索引后全文檢索.
?? PL
字號(hào):
## -*- Perl -*-# $Id: html.pl,v 1.32.4.2 2002/06/17 05:02:59 knok Exp $# Copyright (C) 1997-1999 Satoru Takabayashi All rights reserved.# Copyright (C) 2000 Namazu Project All rights reserved.#     This is free software with ABSOLUTELY NO WARRANTY.##  This program is free software; you can redistribute it and/or modify#  it under the terms of the GNU General Public License as published by#  the Free Software Foundation; either versions 2, or (at your option)#  any later version.# #  This program is distributed in the hope that it will be useful#  but WITHOUT ANY WARRANTY; without even the implied warranty of#  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the#  GNU General Public License for more details.##  You should have received a copy of the GNU General Public License#  along with this program; if not, write to the Free Software#  Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA#  02111-1307, USA##  This file must be encoded in EUC-JP encoding#package html;use strict;require 'gfilter.pl';my $EMBEDDED_FILE = '\.(asp|jsp|php[3s]?|phtml)(?:\.gz)?';sub mediatype() {    return ('text/html');}sub status() {    return 'yes';}sub recursive() {    return 0;}sub pre_codeconv() {    return 1;}sub post_codeconv () {    return 0;}sub add_magic ($) {    return;}sub filter ($$$$$) {    my ($orig_cfile, $cont, $weighted_str, $headings, $fields)      = @_;    my $cfile = defined $orig_cfile ? $$orig_cfile : '';    util::vprint("Processing html file ...\n");    if ($var::Opt{'robotexclude'}) {	my $err = isexcluded($cont);	return $err if $err;    }    if ($cfile =~ /($EMBEDDED_FILE)$/o) {       embedded_filter($cont);    }    html_filter($cont, $weighted_str, $fields, $headings);        gfilter::line_adjust_filter($cont);    gfilter::line_adjust_filter($weighted_str);    gfilter::white_space_adjust_filter($cont);    gfilter::show_filter_debug_info($cont, $weighted_str,			   $fields, $headings);    return undef;}# Check wheter or not the given URI is excluded.sub isexcluded ($) {    my ($contref) = @_;    my $err = undef;    if ($$contref =~ /META\s+NAME\s*=\s*([\'\"]?)ROBOTS\1\s+[^>]*	CONTENT\s*=\s*([\'\"]?).*?(NOINDEX|NONE).*?\2[^>]*>/ix)  #"    {	$err = _("is excluded because of <meta name=\"robots\" ...>");    }    return $err;}sub html_filter ($$$$) {    my ($contref, $weighted_str, $fields, $headings) = @_;    html::escape_lt_gt($contref);    $fields->{'title'} = html::get_title($contref, $weighted_str);    html::get_author($contref, $fields);    html::get_meta_tags($contref, $weighted_str, $fields);    html::get_img_alt($contref);    html::get_table_summary($contref);    html::get_title_attr($contref);    html::normalize_html_element($contref);    html::erase_above_body($contref);    html::remove_comments($contref);    html::weight_element($contref, $weighted_str, $headings);    html::remove_html_elements($contref);    # restore entities of each content.    html::decode_entity($contref);    html::decode_entity($weighted_str);    html::decode_entity($headings);    for my $key (keys %{$fields}) {	html::decode_entity(\$fields->{$key});    }}# Get rid of HTML-embedded codessub embedded_filter ($) {    my ($contref) = @_;    # handle with ASP,JSP,PHP,VBScript,JScript and JavaScript.    $$contref =~ s/<%.*?%>//gs;    $$contref =~ s/<\?.*?\?>//gs;    $$contref =~ s/<asp:.*?\/>//gs;    $$contref =~ s/<jsp:.*?\/>//gs;    $$contref =~ s/<script.*>.*<\/script>//igs;}# Convert independent < > s into entity references for escaping.# Substitute twice for safe.sub escape_lt_gt ($) {    my ($contref) = @_;    $$contref =~ s/\s<\s/ &lt; /g;    $$contref =~ s/\s>\s/ &gt; /g;    $$contref =~ s/\s<\s/ &lt; /g;    $$contref =~ s/\s>\s/ &gt; /g;}sub get_author ($$) {    my ($contref, $fields) = @_;    # <LINK REV=MADE HREF="mailto:ccsatoru@vega.aichi-u.ac.jp">    if ($$contref =~ m!<LINK\s[^>]*?HREF=([\"\'])mailto:(.*?)\1\s*>!i) { #"	    $fields->{'author'} = $2;    } elsif ($$contref =~ m!.*<ADDRESS[^>]*>([^<]*?)</ADDRESS>!i) {	my $tmp = $1;#	$tmp =~ s/\s//g;	if ($tmp =~ /\b([\w\.\-]+\@[\w\.\-]+(?:\.[\w\.\-]+)+)\b/) {	    $fields->{'author'} = $1;	}    }}# Get title from <title>..</title># It's okay to exits two or more <title>...</TITLE>. # First one will be retrieved.sub get_title ($$) {    my ($contref, $weighted_str) = @_;    my $title = '';        if ($$contref =~ s!<TITLE[^>]*>([^<]+)</TITLE>!!i) {	$title = $1;	$title =~ s/\s+/ /g;	$title =~ s/^\s+//;	$title =~ s/\s+$//;	my $weight = $conf::Weight{'html'}->{'title'};	$$weighted_str .= "\x7f$weight\x7f$title\x7f/$weight\x7f\n";    } else {	$title = $conf::NO_TITLE;    }    return $title;}# get foo bar from <META NAME="keywords|description" CONTENT="foo bar"> sub get_meta_tags ($$$) {    my ($contref, $weighted_str, $fields) = @_;        # <meta name="keywords" content="foo bar baz">    my $weight = $conf::Weight{'metakey'};    $$weighted_str .= "\x7f$weight\x7f$3\x7f/$weight\x7f\n" 	if $$contref =~ /<meta\s+name\s*=\s*([\'\"]?) #"	    keywords\1\s+[^>]*content\s*=\s*([\'\"]?)([^>]*?)\2[^>]*>/ix; #"    # <meta name="description" content="foo bar baz">    $$weighted_str .= "\x7f$weight\x7f$3\x7f/$weight\x7f\n" 	if $$contref =~ /<meta\s+name\s*=\s*([\'\"]?)description #"	    \1\s+[^>]*content\s*=\s*([\'\"]?)([^>]*?)\2[^>]*>/ix; #"    if ($var::Opt{'meta'}) {	my @keys = split '\|', $conf::META_TAGS;	for my $key (@keys) {	    while ($$contref =~ /<meta\s+name\s*=\s*([\'\"]?)$key #"	       \1\s+[^>]*content\s*=\s*([\'\"]?)([^>]*?)\2[^>]*>/gix) 	    {		$fields->{$key} .= $3 . " ";	    }	    util::dprint("meta: $key: $fields->{$key}\n") 		if defined $fields->{$key};	}    }}# Get foo from <IMG ... ALT="foo"># It's not to handle HTML strictly.sub get_img_alt ($) {    my ($contref) = @_;    $$contref =~ s/<IMG[^>]*\s+ALT\s*=\s*[\"\']?([^\"\']*)[\"\']?[^>]*>/ $1 /gi; #"}# Get foo from <TABLE ... SUMMARY="foo">sub get_table_summary ($) {    my ($contref) = @_;    $$contref =~ s/<TABLE[^>]*\s+SUMMARY\s*=\s*[\"\']?([^\"\']*)[\"\']?[^>]*>/ $1 /gi; #"}# Get foo from <XXX ... TITLE="foo">sub get_title_attr ($) {    my ($contref) = @_;    $$contref =~ s/<[A-Z]+[^>]*\s+TITLE\s*=\s*[\"\']?([^\"\']*)[\"\']?[^>]*>/ $1 /gi; #"}# Normalize elements like: <A HREF...> -> <A>sub normalize_html_element ($) {    my ($contref) = @_;    $$contref =~ s/<([!\w]+)\s+[^>]*>/<$1>/g;}# Remove contents above <body>.sub erase_above_body ($) {    my ($contref) = @_;    $$contref =~ s/^.*<body>//is;}# remove all comments. it's not perfect but almost works.sub remove_comments ($) {    my ($contref) = @_;    # remove all comments    $$contref =~ s/<!--.*?-->//gs;}# Weight a score of a keyword in a given text using %conf::Weight hash.# This process make the text be surround by temporary tags # \x7fXX\x7f and \x7f/XX\x7f. XX represents score.# Sort keys of %conf::Weight for processing <a> first.# Because <a> has a tendency to be inside of other tags.# Thus, it does'not processing for nexted tags strictly.# Moreover, it does special processing for <h[1-6]> for summarization.sub weight_element ($$$ ) {    my ($contref, $weighted_str, $headings) = @_;    for my $element (sort keys(%{$conf::Weight{'html'}})) {	my $tmp = "";	$$contref =~ s!<($element)>(.*?)</$element>!weight_element_sub($1, $2, \$tmp)!gies;	$$headings .= $tmp if $element =~ /^H[1-6]$/i && ! $var::Opt{'noheadabst'} 	    && $tmp;	my $weight = $element =~ /^H[1-6]$/i && ! $var::Opt{'noheadabst'} ? 	    $conf::Weight{'html'}->{$element} : $conf::Weight{'html'}->{$element} - 1;	$$weighted_str .= "\x7f$weight\x7f$tmp\x7f/$weight\x7f\n" if $tmp;    }}sub weight_element_sub ($$$) {    my ($element, $text, $tmp) = @_;    my $space = element_space($element);    $text =~ s/<[^>]*>//g;    $$tmp .= "$text " if (length($text)) < $conf::INVALID_LENG;    $element =~ /^H[1-6]$/i && ! $var::Opt{'noheadabst'}  ? " " : "$space$text$space";}# determine whether a given element should be delete or be substituted with spacesub element_space ($) {    $_[0] =~ /^($conf::NON_SEPARATION_ELEMENTS)$/io ? "" : " ";}# remove all HTML elements. it's not perfect but almost works.sub remove_html_elements ($) {    my ($contref) = @_;    # remove all elements    $$contref =~ s!</?([A-Z]\w*)(?:\s+[A-Z]\w*(?:\s*=\s*(?:(["']).*?\2|[\w\-.]+))?)*\s*>!element_space($1)!gsixe;}# Decode a numberd entity. Exclude an invalid number.sub decode_numbered_entity ($) {    my ($num) = @_;    return ""	if $num >= 0 && $num <= 8 ||  $num >= 11 && $num <= 31 || $num >=127;    sprintf ("%c",$num);}# Decode an entity. Ignore characters of right half of ISO-8859-1.# Because it can't be handled in EUC encoding.# This function provides sequential entities like: &quot &lt &gt;sub decode_entity ($) {    my ($text) = @_;    return unless defined($$text);    $$text =~ s/&#(\d{2,3})[;\s]/decode_numbered_entity($1)/ge;    $$text =~ s/&#x([\da-f]+)[;\s]/decode_numbered_entity(hex($1))/gei;    $$text =~ s/&quot[;\s]/\"/g; #"    $$text =~ s/&amp[;\s]/&/g;    $$text =~ s/&lt[;\s]/</g;    $$text =~ s/&gt[;\s]/>/g;    $$text =~ s/&nbsp[;\s]/ /g;}# encode entities: only '<', '>', and '&'sub encode_entity ($) {    my ($tmp) = @_;    $$tmp =~ s/&/&amp;/g;    # &amp; should be processed first    $$tmp =~ s/</&lt;/g;    $$tmp =~ s/>/&gt;/g;    $$tmp;}1;

?? 快捷鍵說(shuō)明

復(fù)制代碼 Ctrl + C
搜索代碼 Ctrl + F
全屏模式 F11
切換主題 Ctrl + Shift + D
顯示快捷鍵 ?
增大字號(hào) Ctrl + =
減小字號(hào) Ctrl + -
亚洲欧美第一页_禁久久精品乱码_粉嫩av一区二区三区免费野_久草精品视频
中文字幕不卡三区| 亚洲一区二区成人在线观看| 成人av中文字幕| 午夜天堂影视香蕉久久| 中文字幕欧美三区| 91精品国产手机| 波多野结衣一区二区三区 | 国产欧美日韩精品a在线观看| 色噜噜狠狠色综合欧洲selulu| 久草这里只有精品视频| 亚洲国产日日夜夜| 国产精品久久久久久久久免费桃花 | 99久久婷婷国产综合精品电影| 日韩在线观看一区二区| 国产精品白丝在线| 久久综合九色综合97_久久久 | 日韩一区二区三区免费看 | 另类小说一区二区三区| 亚洲国产日韩一区二区| 综合在线观看色| 中文久久乱码一区二区| 欧美精品一区二| 欧美一区二区三区播放老司机| 欧美做爰猛烈大尺度电影无法无天| 成人va在线观看| 国产米奇在线777精品观看| 美女网站色91| 青青草原综合久久大伊人精品优势| 一区二区三区免费在线观看| 亚洲免费观看在线观看| 亚洲视频一区在线观看| 中文字幕亚洲一区二区av在线| 久久久亚洲精品石原莉奈| 欧美mv和日韩mv的网站| 日韩免费一区二区三区在线播放| 7777精品伊人久久久大香线蕉经典版下载 | 欧美日韩精品一区二区天天拍小说 | 欧美一级淫片007| 亚洲桃色在线一区| 国产精品精品国产色婷婷| 26uuu亚洲| 久久久噜噜噜久久人人看| 国产午夜精品一区二区三区四区| 精品国产伦一区二区三区观看方式| 51精品秘密在线观看| 欧美一区二视频| 日韩三级精品电影久久久| 91精品国产色综合久久不卡电影| 7777女厕盗摄久久久| 日韩精品一区二区三区视频播放 | 国产美女精品一区二区三区| 国精产品一区一区三区mba桃花| 美女精品一区二区| 国产一区二区三区在线观看免费视频 | 国产精品网站在线观看| 中文字幕色av一区二区三区| 日韩伦理免费电影| 亚洲第一福利一区| 美日韩黄色大片| 国产v日产∨综合v精品视频| 99这里只有精品| 欧美丝袜丝交足nylons图片| 欧美一区二区久久| 久久综合网色—综合色88| 国产欧美精品一区| 一区二区三区日韩在线观看| 日韩电影在线免费观看| 福利电影一区二区| 欧美影视一区二区三区| 日韩欧美一区在线| 亚洲国产精品av| 亚洲国产日韩精品| 国产一区二区久久| a级高清视频欧美日韩| 欧美高清www午色夜在线视频| 26uuu成人网一区二区三区| 国产精品美女久久久久久久| 一区二区激情小说| 精品在线免费观看| 在线免费观看视频一区| 日韩欧美不卡一区| 中文字幕亚洲一区二区va在线| 天天综合网 天天综合色| 国产成人av一区二区| 在线观看视频一区| 国产午夜精品在线观看| 五月婷婷综合激情| 成a人片亚洲日本久久| 91精品国产色综合久久不卡蜜臀| 中文字幕欧美激情一区| 欧美aa在线视频| www.av亚洲| 精品国产污污免费网站入口 | 欧美久久一区二区| 国产精品欧美一区二区三区| 日本成人在线不卡视频| 亚洲精品在线免费观看视频| 中文字幕一区在线观看| 全国精品久久少妇| 在线观看视频一区| 国产精品欧美一级免费| 极品销魂美女一区二区三区| 欧美性大战久久久久久久| 国产精品色一区二区三区| 久久精品国产免费看久久精品| 91精品1区2区| 国产午夜精品理论片a级大结局 | 美女网站色91| 欧美影视一区在线| 日韩久久一区二区| 国产成人在线色| 日韩视频一区在线观看| 亚洲bt欧美bt精品| 色综合夜色一区| 国产精品你懂的在线欣赏| 韩国三级在线一区| 69p69国产精品| 亚洲一区二区三区爽爽爽爽爽 | 最新日韩av在线| 国产成人免费视| 久久久www成人免费无遮挡大片| 日韩国产精品久久| 欧美久久一二区| 亚洲国产一区视频| 91国偷自产一区二区开放时间| 中文字幕一区二区视频| 处破女av一区二区| 久久精品一区八戒影视| 国产一区二区三区久久悠悠色av| 欧美一个色资源| 日韩电影在线观看电影| 5月丁香婷婷综合| 日日夜夜免费精品视频| 欧美精品丝袜中出| 亚洲mv在线观看| 69成人精品免费视频| 日本aⅴ亚洲精品中文乱码| 欧美精品v国产精品v日韩精品| 亚州成人在线电影| 91麻豆精品91久久久久久清纯| 日韩中文字幕av电影| 日韩一级高清毛片| 国产揄拍国内精品对白| 国产亚洲精品7777| caoporm超碰国产精品| 亚洲人亚洲人成电影网站色| 91国产精品成人| 亚洲成在线观看| 欧美日韩精品欧美日韩精品一综合| 一区二区三区免费| 91精品国模一区二区三区| 麻豆中文一区二区| 国产亚洲精品aa| 91小视频在线| 首页国产丝袜综合| 欧美精品一区二区三区高清aⅴ| 国产一区二区在线观看免费| 亚洲国产精品国自产拍av| 91麻豆免费观看| 亚洲成av人片一区二区三区| 日韩你懂的电影在线观看| 丁香另类激情小说| 亚洲精品第一国产综合野| 欧美人与z0zoxxxx视频| 经典一区二区三区| 亚洲天堂成人网| 91精品国产手机| 大陆成人av片| 99国内精品久久| 亚洲成年人网站在线观看| 精品国产伦一区二区三区观看体验| 成人综合在线网站| 亚洲一区在线观看免费观看电影高清 | 制服视频三区第一页精品| 韩国精品在线观看| 亚洲免费视频成人| 精品国产亚洲一区二区三区在线观看| 成人免费视频免费观看| 亚洲一区在线观看免费观看电影高清| 日韩午夜在线播放| 一本久久a久久免费精品不卡| 日本中文在线一区| 亚洲情趣在线观看| 日韩美女天天操| 在线视频亚洲一区| 国产久卡久卡久卡久卡视频精品| 亚洲免费观看在线视频| 精品国产欧美一区二区| 在线免费观看一区| 国产成人精品一区二区三区四区| 亚洲亚洲精品在线观看| 国产精品三级视频| 欧美成人a∨高清免费观看| 91看片淫黄大片一级在线观看| 美国精品在线观看| 亚洲一二三专区| 欧美国产亚洲另类动漫| 欧美一级午夜免费电影| 在线观看中文字幕不卡| 国产91精品欧美|