source: gsdl/trunk/perllib/plugins/SourceCodePlugin.pm@ 15865

Last change on this file since 15865 was 15865, checked in by kjdon, 16 years ago

renaming plugins in preparation for my plugin overhaul

  • Property svn:executable set to *
  • Property svn:keywords set to Author Date Id Revision
File size: 7.0 KB
Line 
1###########################################################################
2#
3# SRCPlug.pm -- source code plugin
4#
5# A component of the Greenstone digital library software
6# from the New Zealand Digital Library Project at the
7# University of Waikato, New Zealand.
8#
9# Copyright (C) 1999 New Zealand Digital Library Project
10#
11# This program is free software; you can redistribute it and/or modify
12# it under the terms of the GNU General Public License as published by
13# the Free Software Foundation; either version 2 of the License, or
14# (at your option) any later version.
15#
16# This program is distributed in the hope that it will be useful,
17# but WITHOUT ANY WARRANTY; without even the implied warranty of
18# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
19# GNU General Public License for more details.
20#
21# You should have received a copy of the GNU General Public License
22# along with this program; if not, write to the Free Software
23# Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
24#
25###########################################################################
26# John McPherson Nov 2000
27# originally based on TEXTPlug
28
29# filename is currently used for Title ( optionally minus some prefix )
30
31# Current languages:
32# text: READMEs/Makefiles
33# C/C++ (currently extracts #include statements and C++ class decls)
34# Perl (currently only done as text)
35# Shell (currently only done as text)
36
37# 12/05/02 Added usage datastructure - John Thompson
38
39package SRCPlug;
40
41use BasPlug;
42
43use strict;
44no strict 'refs'; # allow filehandles to be variables and viceversa
45
# Set up inheritance at compile time: SRCPlug derives from BasPlug.
BEGIN {
    @SRCPlug::ISA = qw(BasPlug);
}
49
# Descriptions of the command-line arguments this plugin accepts.
# Each entry gives the argument name, a description (the "{Package.key}"
# strings look like lookup keys for translated text -- TODO confirm against
# BasPlug), its type, its default value and whether it is required.
my $arguments =
    [ { 'name' => "process_exp",
        'desc' => "{BasPlug.process_exp}",
        'type' => "regexp",
        'deft' => get_default_process_exp(),
        'reqd' => "no" },
      { 'name' => "block_exp",
        'desc' => "{BasPlug.block_exp}",
        'type' => "regexp",
        'deft' => get_default_block_exp(),
        'reqd' => "no" },
      { 'name' => "remove_prefix",
        'desc' => "{SRCPlug.remove_prefix}",
        'type' => "regexp",
        # The default strips everything up to and including the last '/'
        # or '\'.  It is single-quoted with a doubled backslash so that the
        # resulting pattern is  ^.*[/\\]  ; the double-quoted form yields
        # ^.*[/\]  which is an unterminated character class.
        'deft' => '^.*[/\\\\]',
        'reqd' => "no" } ];

# Top-level description of the plugin itself; 'args' points at the
# argument list above.
my $options = { 'name'     => "SRCPlug",
                'desc'     => "{SRCPlug.desc}",
                'abstract' => "no",
                'inherits' => "yes",
                'args'     => $arguments };
72
73
# Constructor.
#
# Arguments (after the class name):
#   $pluginlist      - array ref; this class's name is appended to it
#   $inputargs       - handed on unchanged to the BasPlug constructor
#   $hashArgOptLists - hash ref; this plugin's argument descriptions are
#                      appended to its "ArgList" entry and its option
#                      block to its "OptList" entry
#
# Returns the object created by BasPlug's constructor, blessed into $class.
sub new {
    my ($class, $pluginlist, $inputargs, $hashArgOptLists) = @_;

    push @{$pluginlist}, $class;

    if (defined $arguments) {
        push @{ $hashArgOptLists->{"ArgList"} }, @{$arguments};
    }
    if (defined $options) {
        push @{ $hashArgOptLists->{"OptList"} }, $options;
    }

    # Explicit class-method call instead of the indirect-object form
    # ("new BasPlug(...)"), whose parse depends on what names happen to be
    # in scope.
    my $self = BasPlug->new($pluginlist, $inputargs, $hashArgOptLists);

    return bless $self, $class;
}
86
# Default "block" expression: a case-insensitive match on the extensions
# .o, .obj, .a, .so and .dll.
# Takes no meaningful arguments (any invocant is ignored) and returns the
# pattern as a plain string.
sub get_default_block_exp {
    my $pattern = q{(?i)\.(o|obj|a|so|dll)$};
    return $pattern;
}
92
# Default "process" expression: names containing "Makefile" or "README"
# (case-sensitive), or names ending in one of the source extensions
# c, cc, cpp, C, h, hpp, pl, pm, sh (matched case-insensitively).
# Takes no meaningful arguments (any invocant is ignored) and returns the
# pattern as a plain string.
sub get_default_process_exp {
    # Earlier pattern, kept for reference:
    #   return q^(?i)\.te?xt$^;
    my $pattern = q{(Makefile.*|README.*|(?i)\.(c|cc|cpp|C|h|hpp|pl|pm|sh))$};
    return $pattern;
}
99
100
101
# Do plugin-specific processing of doc_obj.
#
# Arguments (after $self):
#   $textref   - reference to the file's text; it is escaped IN PLACE
#   $pluginfo, $base_dir, $metadata
#              - only passed through to process_c_plus_plus
#   $file      - file name; used to guess the file type and to derive the
#                Title and filename metadata
#   $doc_obj   - document object that receives the metadata and the text
#   $gli       - when true, a <Processing .../> line is printed on STDERR
#
# Reads $self->{'outhandle'}, $self->{'verbosity'} and
# $self->{'remove_prefix'}.  Always returns 1.
sub process {
    my $self = shift (@_);
    my ($textref, $pluginfo, $base_dir, $file, $metadata, $doc_obj, $gli) = @_;
    my $outhandle = $self->{'outhandle'};

    print STDERR "<Processing n='$file' p='SRCPlug'>\n" if ($gli);
    print $outhandle "SRCPlug: processing $file\n"
        if $self->{'verbosity'} > 1;

    my $cursection = $doc_obj->get_top_section();

    my $filetype = "text";    # Makefiles, READMEs, ...
    if    ($file =~ /\.(cc|h|cpp|C)$/) { $filetype = "C++"; }  # assume all .h files...
    elsif ($file =~ /\.c$/)            { $filetype = "C"; }
    elsif ($file =~ /\.p(l|m)$/)       { $filetype = "perl"; }
    elsif ($file =~ /\.sh$/)           { $filetype = "sh"; }

    # modify '<' and '>' for GML... (even though inside <pre> tags!!)
    $$textref =~ s/</&lt;/g;
    $$textref =~ s/>/&gt;/g;
    $$textref =~ s/_/&#95;/g;
    # try _escape_text($text) from doc.pm....

    # don't want mg to turn escape chars into actual values
    $$textref =~ s/\\/\\\\/g;

    # Use the filename (minus any prefix) as the title.
    #
    # The remove_prefix option is honoured when it is set and non-empty.
    # (The test used to be written $self->{'remove_prefix' ne ""}, which
    # looks up the hash key "1" and therefore never took this branch.)
    # The pattern is compiled inside eval so that an invalid expression
    # falls back to stripping the directory part instead of aborting.
    my $title = $file;
    my $prefix = $self->{'remove_prefix'};
    my $prefix_re;
    if (defined $prefix && $prefix ne "") {
        $prefix_re = eval { qr/^$prefix/ };
        if (!defined $prefix_re && $self->{'verbosity'} > 1) {
            print $outhandle "SRCPlug: ignoring invalid remove_prefix "
                . "expression '$prefix': $@";
        }
    }
    if (defined $prefix_re) {
        $title =~ s/$prefix_re//;
    } else {
        $title =~ s@^.*[/\\]@@;    # remove pathname by default
    }
    $doc_obj->add_utf8_metadata ($cursection, "Title", $title);
    $doc_obj->add_metadata ($cursection, "FileFormat", "SRC");

    # remove the gsdl prefix from the filename
    my $relative_filename = $file;
    $relative_filename =~ s@^.*?gsdl[/\\]@@;
    $doc_obj->add_utf8_metadata ($cursection, "filename", $relative_filename);

    # class information from .h and .cc and .C and .cpp files
    if ($filetype eq "C++") {
        process_c_plus_plus($textref, $pluginfo, $base_dir,
                            $file, $metadata, $doc_obj);
    } elsif ($filetype eq "C") {
        get_includes_metadata($textref, $doc_obj);
    }

    # default operation...
    # insert preformat tags and add text to document object
    $doc_obj->add_utf8_text($cursection, "<pre>\n$$textref\n</pre>");

    return 1;
}
161
162
163
164
# Record the headers named in '#include' directives as "includes" metadata
# on the document's top section.
#
#   $textref - reference to the (already escaped) source text; angle
#              brackets are expected in their &lt; / &gt; form
#   $doc_obj - document object that is queried for existing "includes"
#              values and receives the new ones
#
# A header that is already present, or that occurs more than once in the
# text, is added only once.
sub get_includes_metadata {
    my ($textref, $doc_obj) = @_;

    my $topsection = $doc_obj->get_top_section();

    # Nothing to do when there is no '#include' directive at all.
    return unless $$textref =~ /\#\s*include\b/;

    my @headers =
        ($$textref =~ m/^\s*\#\s*include\s*(?:\"|&lt;)(.*?)(?:\"|&gt;)/mg);

    # Start from whatever the document already lists.
    my $existing = $doc_obj->get_metadata($topsection, "includes");
    my %seen;
    if (defined($existing)) {
        $seen{$_} = 1 for @$existing;
    }

    for my $header (@headers) {
        next if $seen{$header};
        $seen{$header} = 1;
        $doc_obj->add_utf8_metadata($topsection, "includes", $header);
    }
}
194
195
196
# Extract C++-specific metadata from a source file: the '#include'
# metadata (via get_includes_metadata) plus "class" and "classdecl"
# metadata for every class declaration found.
#
#   $textref - reference to the (already escaped) source text; not modified
#   $doc_obj - document object receiving the metadata
#   $pluginfo, $base_dir, $file, $metadata - accepted but unused here
#
# For each line that mentions the word "class" (after comments have been
# removed) and is not a friend or forward declaration:
#   * the class name is added as "class" metadata unless already present
#   * the whole line is added as "classdecl" metadata
# Always returns 1.
#
# NOTE(review): process() rewrites '_' as '&#95;' before calling this, so a
# class name containing an underscore is cut short at the '&' -- confirm
# whether that is intended.
sub process_c_plus_plus {
    my ($textref, $pluginfo, $base_dir, $file, $metadata, $doc_obj) = @_;

    my $topsection = $doc_obj->get_top_section();

    # Check for include metadata
    get_includes_metadata($textref, $doc_obj);

    # Get class declarations (but not forward declarations...) as metadata
    return 1 unless $$textref =~ /\bclass\b/;

    my $classnames = $$textref;

    # remove commented lines
    $classnames =~ s@/\*.*?\*/@@sg;
    $classnames =~ s@//.*$@@mg;

    # Walk the text one line at a time.  The earlier implementation deleted
    # leading lines with s/.*\n// until the first line contained "class";
    # that never terminated when the last such line had no trailing
    # newline.
    foreach my $wholeline (split /\n/, $classnames) {
        next unless $wholeline =~ /\bclass\b/;

        # don't index if merely a reference/fwd decl. of another class
        next if $wholeline =~ /(friend\Wclass)|(class\W\w+\W?\;)|(\/\/.*class)/;

        # $wholeline is e.g. "class StaffSystem: public BaseStaffSystem".
        # If no name can be picked out, the whole line is used as the name
        # (unchanged from the earlier behaviour).
        my $classname = $wholeline;
        $classname =~ s/.*class\W(\w+).*/$1/;

        my $classes = $doc_obj->get_metadata($topsection, "class");
        my $already_known = grep { "$_" eq "$classname" } @{ $classes || [] };
        if (!$already_known) {
            $doc_obj->add_utf8_metadata($topsection, "class", $classname);
        }
        $doc_obj->add_utf8_metadata($topsection, "classdecl", $wholeline);
    }

    return 1;
}
247
2481;
249
Note: See TracBrowser for help on using the repository browser.