/usr/share/namazu/filter/rfc.pl is in namazu2-index-tools 2.0.21-9.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 | #
# -*- Perl -*-
# $Id: rfc.pl,v 1.17.8.1 2007-01-14 04:12:04 opengl2772 Exp $
# Copyright (C) 1997-2000 Satoru Takabayashi ,
# 1999 NOKUBI Takatsugu All rights reserved.
# 2000-2007 Namazu Project All rights reserved.
# This is free software with ABSOLUTELY NO WARRANTY.
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either versions 2, or (at your option)
# any later version.
#
# This program is distributed in the hope that it will be useful
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA
# 02111-1307, USA
#
# This file must be encoded in EUC-JP encoding
#
package rfc;
use strict;
require 'util.pl';
require 'gfilter.pl';
sub mediatype() {
return ('text/plain; x-type=rfc');
}
sub status() {
return 'yes';
}
sub recursive() {
return 0;
}
sub pre_codeconv() {
return 1; # For translated documents.
}
sub post_codeconv () {
return 0;
}
sub add_magic ($) {
my ($magic) = @_;
$magic->addSpecials("text/plain; x-type=rfc",
"^Network Working Group",
"^Request [fF]or Comments",
"^Obsoletes:",
"^Category:",
"^Updates:");
# FIXME: very ad hoc.
$magic->addFileExts('^rfc\d+\.txt$', 'text/plain; x-type=rfc');
$magic->addFileExts('^draft-(\w*-)+-\d+\.txt$', 'text/plain; x-type=internet-draft');
$magic->addFileExts('^fyi\d+\.txt$' => 'text/plain; x-type=fyi');
return;
}
sub filter ($$$$$) {
my ($orig_cfile, $cont, $weighted_str, $headings, $fields)
= @_;
my $cfile = defined $orig_cfile ? $$orig_cfile : '';
util::vprint("Processing rfc file ...\n");
rfc_filter($cont, $weighted_str, $fields);
gfilter::line_adjust_filter($cont);
gfilter::line_adjust_filter($weighted_str);
gfilter::white_space_adjust_filter($cont);
gfilter::show_filter_debug_info($cont, $weighted_str,
$fields, $headings);
return undef;
}
# It's not perfect because of fuzziness in RFC documents.
sub rfc_filter ($$$) {
my ($contref, $weighted_str, $fields) = @_;
$$contref =~ s/^\s+//s;
# Get an author name first.
if ($$contref =~ /^Network Working Group\s+(\S.*\S)\s*$/m) {
$fields->{'author'} = $1;
}
# Handle the header.
if ($$contref =~ s/((.+\n)+)\s+(.*)//) {
$$weighted_str .= "\x7f1\x7f$1\x7f/1\x7f\n" if defined $1;
# Get the title.
my $title = $3 if defined $3;
$fields->{'title'} = $title;
my $weight = $conf::Weight{'html'}->{'title'};
$$weighted_str .= "\x7f$weight\x7f$title\x7f/$weight\x7f\n";
}
# Get Summary or Introduction and put it at the beginning
# for summarization.
# $$contref =~ s/\A(.+?^(\d+\.\s*)?(Abstract|Introduction)\n\n)//ims;
$$contref =~ s/([\s\S]+^(\d+\.\s*)?(Abstract|Introduction)\n\n)//im;
$$weighted_str .= "\x7f1\x7f$1\x7f/1\x7f\n" if defined $1;
}
1;
|