Source code of Windows XP (NT5)
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

392 lines
9.7 KiB

  1. package B::Xref;
  2. =head1 NAME
  3. B::Xref - Generates cross reference reports for Perl programs
  4. =head1 SYNOPSIS
  5. perl -MO=Xref[,OPTIONS] foo.pl
  6. =head1 DESCRIPTION
  7. The B::Xref module is used to generate a cross reference listing of all
  8. definitions and uses of variables, subroutines and formats in a Perl program.
  9. It is implemented as a backend for the Perl compiler.
  10. The report generated is in the following format:
  11. File filename1
  12. Subroutine subname1
  13. Package package1
  14. object1 C<line numbers>
  15. object2 C<line numbers>
  16. ...
  17. Package package2
  18. ...
  19. Each B<File> section reports on a single file. Each B<Subroutine> section
  20. reports on a single subroutine apart from the special cases
  21. "(definitions)" and "(main)". These report, respectively, on subroutine
  22. definitions found by the initial symbol table walk and on the main part of
  23. the program or module external to all subroutines.
  24. The report is then grouped by the B<Package> of each variable,
  25. subroutine or format with the special case "(lexical)" meaning
  26. lexical variables. Each B<object> name (implicitly qualified by its
  27. containing B<Package>) includes its type character(s) at the beginning
  28. where possible. Lexical variables are easier to track and even
  29. include dereferencing information where possible.
  30. The C<line numbers> are a comma separated list of line numbers (some
  31. preceded by code letters) where that object is used in some way.
  32. Simple uses aren't preceded by a code letter. Introductions (such as
  33. where a lexical is first defined with C<my>) are indicated with the
  34. letter "i". Subroutine and method calls are indicated by the character
  35. "&". Subroutine definitions are indicated by "s" and format
  36. definitions by "f".
  37. =head1 OPTIONS
  38. Option words are separated by commas (not whitespace) and follow the
  39. usual conventions of compiler backend options.
  40. =over 8
  41. =item C<-oFILENAME>
  42. Directs output to C<FILENAME> instead of standard output.
  43. =item C<-r>
  44. Raw output. Instead of producing a human-readable report, outputs a line
  45. in machine-readable form for each definition/use of a variable/sub/format.
  46. =item C<-D[tO]>
  47. (Internal) debug options, probably only useful if C<-r> included.
  48. The C<t> option prints the object on the top of the stack as it's
  49. being tracked. The C<O> option prints each operator as it's being
  50. processed in the execution order of the program.
  51. =back
  52. =head1 BUGS
  53. Non-lexical variables are quite difficult to track through a program.
  54. Sometimes the type of a non-lexical variable's use is impossible to
  55. determine. Introductions of non-lexical non-scalars don't seem to be
  56. reported properly.
  57. =head1 AUTHOR
  58. Malcolm Beattie, mbeattie@sable.ox.ac.uk.
  59. =cut
  60. use strict;
  61. use B qw(peekop class comppadlist main_start svref_2object walksymtable);
  # Constants (should probably be elsewhere)

  # Bit tested against $op->private to tell an introduction from a plain use.
  sub OPpLVAL_INTRO () { 0x80 }

  # Bit tested against $sv->FLAGS before the string value of an SV is read.
  sub SVf_POK       () { 0x00040000 }

  # Placeholder [pack, type, name] triple. A new array is built on every
  # call, so callers may modify the result without affecting each other.
  sub UNKNOWN { [ ("?") x 3 ] }
  # Lexicals in the current pad, indexed by pad offset.
  # Each entry is ["(lexical)", type, name].
  my @pad;

  # Keyed by $$op: set when each $op is done.
  my %done;

  # Shadows the top element of the stack as [pack, type, name]
  # (pack can be "(lexical)").
  my $top = UNKNOWN();

  my $file;       # shadows current filename
  my $line;       # shadows current line number
  my $subname;    # shadows current sub name

  # Multi-level hash to record all uses etc.
  my %table;

  # List of CVs that need processing.
  my @todo = ();

  # Event name => code prefixed to each line number in the report.
  my %code = (
      intro   => "i",
      used    => "",
      subdef  => "s",
      subused => "&",
      formdef => "f",
      meth    => "->",
  );

  # Options
  my $debug_op;     # warn about each op as it is visited
  my $debug_top;    # warn about $top before each op is handled
  my $nodefs;       # skip the "(definitions)" pass
  my $raw;          # print one line per event instead of building %table
  # Record a single event for a variable, sub or format at the current
  # $file/$subname/$line.
  #
  #   $var   - array ref of [pack, type, name]
  #   $event - event name ("intro", "used", "subdef", "subused", "formdef",
  #            "meth")
  #
  # In raw mode the event is printed straight away; otherwise the current
  # line number is appended to the matching slot of %table.
  sub process {
      my ($var, $event) = @_;
      my ($pack, $type, $name) = @$var;

      if ($type eq "*") {
          # A plain use of a glob is not recorded at all.
          return if $event eq "used";
          # A glob that is called is recorded as a subroutine.
          $type = "&" if $event eq "subused";
      }

      # Strip a trailing "*" that follows some other type character.
      $type =~ s/(.)\*$/$1/g;

      if (!$raw) {
          # Wheee
          push @{ $table{$file}->{$subname}->{$pack}->{$type . $name}->{$event} },
              $line;
      } else {
          printf "%-16s %-12s %5d %-12s %4s %-16s %s\n",
              $file, $subname, $line, $pack, $type, $name, $event;
      }
  }
  # Rebuild @pad from the names array of $padlist.
  #
  # @pad is always emptied first. Nothing more happens when $padlist is a
  # "SPECIAL" object. Otherwise every named slot from index 1 upwards gets
  # an entry ["(lexical)", first character of the name, rest of the name];
  # slots whose name SV is "SPECIAL" are left unset.
  sub load_pad {
      my ($padlist) = @_;

      @pad = ();
      return if class($padlist) eq "SPECIAL";

      # The first element of the padlist is the AV holding the names.
      my ($names_av) = $padlist->ARRAY;
      my @names = $names_av->ARRAY;

      for my $slot (1 .. $#names) {
          my $name_sv = $names[$slot];
          next if class($name_sv) eq "SPECIAL";

          my ($sigil, $ident) = $name_sv->PV =~ /^(.)(.*)$/;
          $pad[$slot] = ["(lexical)", $sigil, $ident];
      }
  }
  # Walk the op chain beginning at $start, following ->next, and dispatch
  # each op to the sub in this package named after its ppaddr (pp_padsv,
  # pp_gv, ...) when such a sub exists.
  #
  # Ops that carry extra branches are handled here by recursing into those
  # branches. Every op is visited at most once: the walk stops as soon as
  # it reaches an op already recorded in %done.
  #
  # The original code had a second, unreachable "pp_subst" branch after
  # "pp_enterloop"; pp_subst is already handled together with pp_match, so
  # the duplicate has been removed.
  sub xref {
      my $start = shift;
      my $op;
      for ($op = $start; $$op; $op = $op->next) {
          last if $done{$$op}++;
          warn sprintf("top = [%s, %s, %s]\n", @$top) if $debug_top;
          warn peekop($op), "\n" if $debug_op;
          my $ppname = $op->ppaddr;
          if ($ppname =~ /^pp_(or|and|mapwhile|grepwhile)$/) {
              # Logical ops: also walk the alternative branch.
              xref($op->other);
          } elsif ($ppname eq "pp_match" || $ppname eq "pp_subst") {
              # Pattern ops: also walk the replacement code, if any.
              xref($op->pmreplstart);
          } elsif ($ppname eq "pp_substcont") {
              xref($op->other->pmreplstart);
              $op = $op->other;
              # redo re-enters the loop body for the new $op without
              # running the loop's condition or increment.
              redo;
          } elsif ($ppname eq "pp_cond_expr") {
              # pp_cond_expr never returns op_next
              xref($op->true);
              $op = $op->false;
              redo;
          } elsif ($ppname eq "pp_enterloop") {
              xref($op->redoop);
              xref($op->nextop);
              xref($op->lastop);
          } else {
              # Symbolic call of the handler named after the op, if defined.
              no strict 'refs';
              &$ppname($op) if defined(&$ppname);
          }
      }
  }
  # Cross reference the body of one CV.
  #
  # $subname is set to the sub's name (prefixed with "Package::" unless the
  # package is "main") while its pad is loaded and its ops are walked, and
  # is reset to "(main)" afterwards.
  sub xref_cv {
      my ($cv) = @_;

      my $gv     = $cv->GV;
      my $pack   = $gv->STASH->NAME;
      my $prefix = $pack eq "main" ? "" : "$pack\::";

      $subname = $prefix . $gv->NAME;
      load_pad($cv->PADLIST);
      xref($cv->START);
      $subname = "(main)";
  }
  # Cross reference the sub behind a code reference: the reference is
  # turned into its B object and handed to xref_cv.
  sub xref_object {
      my ($cvref) = @_;
      my $cv = svref_2object($cvref);
      xref_cv($cv);
  }
  # Cross reference the main program: load the main pad, walk the ops from
  # main_start under the sub name "(main)", then process every CV queued
  # in @todo.
  sub xref_main {
      $subname = "(main)";
      load_pad(comppadlist());
      xref(main_start());

      xref_cv(shift @todo) while @todo;
  }
  # Start of a new statement: refresh the current file name and line number
  # from the op and forget whatever was shadowing the top of the stack.
  sub pp_nextstate {
      my ($op) = @_;

      $line = $op->line;
      $file = $op->filegv->SV->PV;
      $top  = UNKNOWN();
  }
  # A lexical is pushed: make $top describe it and record the access as
  # "intro" when the op's private flags carry OPpLVAL_INTRO, otherwise as
  # "used".
  #
  # $top receives a *copy* of the @pad entry. deref() rewrites the type
  # field of whatever $top refers to, so handing out the @pad entry itself
  # would let one dereference (e.g. @$x) permanently change how every later
  # use of the same lexical is reported.
  #
  # A pad slot with no entry (load_pad skips "SPECIAL" names) is reported
  # as UNKNOWN instead of dying on an undefined array reference.
  sub pp_padsv {
      my $op = shift;
      my $entry = $pad[$op->targ];
      $top = $entry ? [@$entry] : UNKNOWN();
      process($top, ($op->private & OPpLVAL_INTRO()) ? "intro" : "used");
  }

  # Array and hash lexicals are handled exactly like scalar lexicals.
  sub pp_padav { pp_padsv(@_) }
  sub pp_padhv { pp_padsv(@_) }
  # Record a dereference of $var as type $as.
  #
  # The type field of $var is modified in place: $as is prepended to it
  # (so "$" dereferenced as "@" becomes "@$"), and the result is recorded
  # as a "used" event.
  sub deref {
      my ($var, $as) = @_;

      my $inner_type = $var->[1];
      $var->[1] = $as . $inner_type;
      process($var, "used");
  }
  # Dereferencing ops: each one records $top as dereferenced with the
  # sigil that belongs to the kind of thing being fetched.
  sub pp_rv2sv { deref($top, '$') }
  sub pp_rv2av { deref($top, '@') }
  sub pp_rv2hv { deref($top, '%') }
  sub pp_rv2cv { deref($top, '&') }
  sub pp_rv2gv { deref($top, '*') }
  # A package scalar is pushed: make $top describe it as
  # [package, '$', name] and record it as "intro" or "used" depending on
  # the OPpLVAL_INTRO bit of the op's private flags.
  sub pp_gvsv {
      my ($op) = @_;

      my $gv    = $op->gv;
      my $event = ($op->private & OPpLVAL_INTRO()) ? "intro" : "used";

      $top = [$gv->STASH->NAME, '$', $gv->NAME];
      process($top, $event);
  }
  # A glob is pushed: make $top describe it as [package, "*", name] and
  # record it as "intro" or "used" depending on the OPpLVAL_INTRO bit of
  # the op's private flags. (process() drops plain "used" events for
  # globs.)
  sub pp_gv {
      my ($op) = @_;

      my $gv    = $op->gv;
      my $event = ($op->private & OPpLVAL_INTRO()) ? "intro" : "used";

      $top = [$gv->STASH->NAME, "*", $gv->NAME];
      process($top, $event);
  }
  # A constant is pushed: $top becomes ["?", "", text], where text is the
  # constant's string value when its SV is not "SPECIAL" and has the
  # SVf_POK flag set, and "?" otherwise. Nothing is recorded.
  sub pp_const {
      my ($op) = @_;

      my $sv   = $op->sv;
      my $text = "?";
      if (class($sv) ne "SPECIAL" && $sv->FLAGS & SVf_POK()) {
          $text = $sv->PV;
      }

      $top = ["?", "", $text];
  }
  # A method lookup: re-label $top as belonging to the pseudo-package
  # "(method)", with "->" prepended to its type and its name kept.
  sub pp_method {
      my $op = shift;

      my ($type, $name) = @{$top}[1, 2];
      $top = ["(method)", "->" . $type, $name];
  }
  # A sub call: record $top as "meth" when its type is "m", otherwise as
  # "subused", then reset $top.
  #
  # NOTE(review): nothing visible in this file ever sets the type to "m"
  # (pp_method produces a type beginning with "->"), so the "meth" case
  # looks unreachable and method calls end up recorded as "subused".
  # Confirm the intended behaviour before changing the test.
  sub pp_entersub {
      my $op = shift;

      my $event = $top->[1] eq "m" ? "meth" : "subused";
      process($top, $event);
      $top = UNKNOWN();
  }
  222. #
  223. # Stuff for cross referencing definitions of variables and subs
  224. #
  # Handler invoked by the symbol table walk for each GV (it is passed to
  # walksymtable by name as "xref").
  #
  # If the glob has a CV, a "subdef" event is recorded at the glob's file
  # and line and the CV is queued in @todo for later processing.
  # If the glob has a format that has not been seen before, a "formdef"
  # event is recorded in the same way.
  sub B::GV::xref {
      my ($gv) = @_;

      my $cv = $gv->CV;
      if ($$cv) {
          #return if $done{$$cv}++;
          $file = $gv->FILEGV->SV->PV;
          $line = $gv->LINE;
          process([$gv->STASH->NAME, "&", $gv->NAME], "subdef");
          push @todo, $cv;
      }

      my $form = $gv->FORM;
      return unless $$form;
      return if $done{$$form}++;

      $file = $gv->FILEGV->SV->PV;
      $line = $gv->LINE;
      process([$gv->STASH->NAME, "", $gv->NAME], "formdef");
  }
  # Walk the symbol table from main:: and record every sub and format
  # definition under the sub name "(definitions)". Does nothing when
  # $nodefs is set. A fixed list of packages is excluded from the walk.
  sub xref_definitions {
      return if $nodefs;
      $subname = "(definitions)";

      # Keys carry the trailing "::" because that is the form in which the
      # filter below looks them up.
      my %exclude = map { ($_ . "::" => 1) }
          qw(B O AutoLoader DynaLoader Config DB VMS
             strict vars FileHandle Exporter Carp);

      no strict qw(vars refs);
      walksymtable(\%{"main::"}, "xref", sub { !defined($exclude{$_[0]}) });
  }
  # Print the report collected in %table, sorted at every level:
  # file, then subroutine, then package, then object name. For each object
  # the recorded line numbers are listed per event in the fixed order
  # intro, formdef, subdef, meth, subused, used, each prefixed with the
  # event's code from %code. Prints nothing in raw mode.
  sub output {
      return if $raw;

      for my $file (sort keys %table) {
          my $perfile = $table{$file};
          print "File $file\n";

          for my $subname (sort keys %$perfile) {
              my $persubname = $perfile->{$subname};
              print " Subroutine $subname\n";

              for my $pack (sort keys %$persubname) {
                  my $perpack = $persubname->{$pack};
                  print " Package $pack\n";

                  for my $name (sort keys %$perpack) {
                      my $pername = $perpack->{$name};
                      my @lines;

                      for my $ev (qw(intro formdef subdef meth subused used)) {
                          my $perev = $pername->{$ev};
                          next unless defined($perev) && @$perev;

                          my $prefix = $code{$ev};
                          push @lines, map { $prefix . $_ } @$perev;
                      }

                      printf " %-16s %s\n", $name, join(", ", @lines);
                  }
              }
          }
      }
  }
  # Entry point called by the compiler front end with the backend options.
  #
  # Leading words that start with "-" are options:
  #   -oFILENAME  redirect STDOUT to FILENAME (the name may also be the
  #               next word)
  #   -d          skip the "(definitions)" pass
  #   -r          raw output
  #   -D[oOt]     debug flags: "o" calls B->debug(1), "O" warns about each
  #               op, "t" warns about the shadowed top of stack
  #   --          end of options
  # Every remaining word names a sub to cross reference; names without
  # "::" are taken to be in main::.
  #
  # Returns a code ref that performs the cross reference, or an error
  # string when the output file cannot be opened or -o has no filename.
  sub compile {
      my @options = @_;
      my ($option, $opt, $arg);
    OPTION:
      while ($option = shift @options) {
          if ($option =~ /^-(.)(.*)/) {
              $opt = $1;
              $arg = $2;
          } else {
              # First non-option word: put it back, it is an object name.
              unshift @options, $option;
              last OPTION;
          }
          if ($opt eq "-" && $arg eq "-") {
              # "--" itself has already been shifted off by the loop
              # condition. The original shifted once more here, which
              # silently discarded the first object name after "--".
              last OPTION;
          } elsif ($opt eq "o") {
              $arg ||= shift @options;
              return "-o: missing output filename\n"
                  unless defined($arg) && length($arg);
              # Three-argument open: the filename is never parsed for
              # mode characters.
              open(STDOUT, ">", $arg) or return "$arg: $!\n";
          } elsif ($opt eq "d") {
              $nodefs = 1;
          } elsif ($opt eq "r") {
              $raw = 1;
          } elsif ($opt eq "D") {
              $arg ||= shift @options;
              $arg = "" unless defined $arg;
              foreach my $flag (split(//, $arg)) {
                  if ($flag eq "o") {
                      B->debug(1);
                  } elsif ($flag eq "O") {
                      $debug_op = 1;
                  } elsif ($flag eq "t") {
                      $debug_top = 1;
                  }
              }
          }
      }
      if (@options) {
          return sub {
              xref_definitions();
              foreach my $objname (@options) {
                  $objname = "main::$objname" unless $objname =~ /::/;
                  # Look the sub up by name with a symbolic reference
                  # instead of building Perl source from the option text
                  # and running it through string eval.
                  eval {
                      no strict 'refs';
                      xref_object(\&$objname);
                  };
                  die "xref_object(\\&$objname) failed: $@" if $@;
              }
              output();
          };
      } else {
          return sub {
              xref_definitions();
              xref_main();
              output();
          };
      }
  }
  337. 1;