merge: use refresh_and_write_cache
[git/git.git] / gitweb / gitweb.perl
CommitLineData
161332a5
KS
1#!/usr/bin/perl
2
c994d620 3# gitweb - simple web interface to track changes in git repositories
22fafb99 4#
00cd0794
KS
5# (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
6# (C) 2005, Christian Gierke
823d5dc8 7#
d8f1c5c2 8# This program is licensed under the GPLv2
161332a5 9
d48b2841 10use 5.008;
161332a5
KS
11use strict;
12use warnings;
411ddf9e
GC
13# handle ACL in file access tests
14use filetest 'access';
19806691 15use CGI qw(:standard :escapeHTML -nosticky);
7403d50b 16use CGI::Util qw(unescape);
7a597457 17use CGI::Carp qw(fatalsToBrowser set_message);
40c13813 18use Encode;
b87d78d6 19use Fcntl ':mode';
7a13b999 20use File::Find qw();
cb9c6e5b 21use File::Basename qw(basename);
3962f1d7 22use Time::HiRes qw(gettimeofday tv_interval);
7d5b30e0
ÆAB
23use Digest::MD5 qw(md5_hex);
24
10bb9036 25binmode STDOUT, ':utf8';
161332a5 26
13dbf46a
JK
27if (!defined($CGI::VERSION) || $CGI::VERSION < 4.08) {
28 eval 'sub CGI::multi_param { CGI::param(@_) }'
29}
30
3962f1d7 31our $t0 = [ gettimeofday() ];
aa7dd05e
JN
32our $number_of_git_cmds = 0;
33
b1f5f64f 34BEGIN {
3be8e720 35 CGI->compile() if $ENV{'MOD_PERL'};
b1f5f64f
JN
36}
37
06c084d2 38our $version = "++GIT_VERSION++";
3e029299 39
c2394fe9
JN
40our ($my_url, $my_uri, $base_url, $path_info, $home_link);
41sub evaluate_uri {
42 our $cgi;
81d3fe9f 43
c2394fe9
JN
44 our $my_url = $cgi->url();
45 our $my_uri = $cgi->url(-absolute => 1);
46
47 # Base URL for relative URLs in gitweb ($logo, $favicon, ...),
48 # needed and used only for URLs with nonempty PATH_INFO
49 our $base_url = $my_url;
50
51 # When the script is used as DirectoryIndex, the URL does not contain the name
52 # of the script file itself, and $cgi->url() fails to strip PATH_INFO, so we
53 # have to do it ourselves. We make $path_info global because it's also used
54 # later on.
55 #
56 # Another issue with the script being the DirectoryIndex is that the resulting
57 # $my_url data is not the full script URL: this is good, because we want
58 # generated links to keep implying the script name if it wasn't explicitly
59 # indicated in the URL we're handling, but it means that $my_url cannot be used
60 # as base URL.
61 # Therefore, if we needed to strip PATH_INFO, then we know that we have
62 # to build the base URL ourselves:
84d9e2d5 63 our $path_info = decode_utf8($ENV{"PATH_INFO"});
c2394fe9 64 if ($path_info) {
cacfc09b
JS
65 # $path_info has already been URL-decoded by the web server, but
66 # $my_url and $my_uri have not. URL-decode them so we can properly
67 # strip $path_info.
68 $my_url = unescape($my_url);
69 $my_uri = unescape($my_uri);
c2394fe9
JN
70 if ($my_url =~ s,\Q$path_info\E$,, &&
71 $my_uri =~ s,\Q$path_info\E$,, &&
72 defined $ENV{'SCRIPT_NAME'}) {
73 $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
74 }
81d3fe9f 75 }
c2394fe9
JN
76
77 # target of the home link on top of all pages
78 our $home_link = $my_uri || "/";
b65910fe
GB
79}
80
e130ddaa
AT
81# core git executable to use
82# this can just be "git" if your webserver has a sensible PATH
06c084d2 83our $GIT = "++GIT_BINDIR++/git";
3f7f2710 84
b87d78d6 85# absolute fs-path which will be prepended to the project path
4a87b43e 86#our $projectroot = "/pub/scm";
06c084d2 87our $projectroot = "++GITWEB_PROJECTROOT++";
b87d78d6 88
ca5e9495
LL
89# fs traversing limit for getting project list
90# the number is relative to the projectroot
91our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
92
2de21fac
YS
93# string of the home link on top of all pages
94our $home_link_str = "++GITWEB_HOME_LINK_STR++";
95
ad9c2e22
TF
96# extra breadcrumbs preceding the home link
97our @extra_breadcrumbs = ();
98
49da1daf
AT
99# name of your site or organization to appear in page titles
100# replace this with something more descriptive for clearer bookmarks
8be2890c
PB
101our $site_name = "++GITWEB_SITENAME++"
102 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
49da1daf 103
c1355b7f
LH
104# html snippet to include in the <head> section of each page
105our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
b2d3476e
AC
106# filename of html text to include at top of each page
107our $site_header = "++GITWEB_SITE_HEADER++";
8ab1da2c 108# html text to include at home page
06c084d2 109our $home_text = "++GITWEB_HOMETEXT++";
b2d3476e
AC
110# filename of html text to include at bottom of each page
111our $site_footer = "++GITWEB_SITE_FOOTER++";
112
113# URI of stylesheets
114our @stylesheets = ("++GITWEB_CSS++");
887a612f
PB
115# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
116our $stylesheet = undef;
9a7a62ff 117# URI of GIT logo (72x27 size)
06c084d2 118our $logo = "++GITWEB_LOGO++";
0b5deba1
JN
119# URI of GIT favicon, assumed to be image/png type
120our $favicon = "++GITWEB_FAVICON++";
4af819d4
JN
121# URI of gitweb.js (JavaScript code for gitweb)
122our $javascript = "++GITWEB_JS++";
aedd9425 123
9a7a62ff
JN
124# URI and label (title) of GIT logo link
125#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
126#our $logo_label = "git documentation";
69fb8283 127our $logo_url = "http://git-scm.com/";
9a7a62ff 128our $logo_label = "git homepage";
51a7c66a 129
09bd7898 130# source of projects list
06c084d2 131our $projects_list = "++GITWEB_LIST++";
b87d78d6 132
55feb120
MH
133# the width (in characters) of the projects list "Description" column
134our $projects_list_description_width = 25;
135
d940c901
SC
136# group projects by category on the projects list
137# (enabled if this variable evaluates to true)
138our $projects_list_group_categories = 0;
139
140# default category if none specified
141# (leave the empty string for no category)
142our $project_list_default_category = "";
143
b06dcf8c
FL
144# default order of projects list
145# valid values are none, project, descr, owner, and age
146our $default_projects_order = "project";
147
32f4aacc
ML
148# show repository only if this file exists
149# (only effective if this variable evaluates to true)
150our $export_ok = "++GITWEB_EXPORT_OK++";
151
5710be46
KK
152# don't generate age column on the projects list page
153our $omit_age_column = 0;
154
0ebe7827
KK
155# don't generate information about owners of repositories
156our $omit_owner=0;
157
dd7f5f10
AG
158# show repository only if this subroutine returns true
159# when given the path to the project, for example:
160# sub { return -e "$_[0]/git-daemon-export-ok"; }
161our $export_auth_hook = undef;
162
32f4aacc
ML
163# only allow viewing of repositories also shown on the overview page
164our $strict_export = "++GITWEB_STRICT_EXPORT++";
165
19a8721e
JN
166# list of git base URLs used for URL to where fetch project from,
167# i.e. full URL is "$git_base_url/$project"
d6b7e0b9 168our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
19a8721e 169
f5aa79d9 170# default blob_plain mimetype and default charset for text/plain blob
4a87b43e
DS
171our $default_blob_plain_mimetype = 'text/plain';
172our $default_text_plain_charset = undef;
f5aa79d9 173
2d007374
PB
174# file to use for guessing MIME types before trying /etc/mime.types
175# (relative to the current git repository)
4a87b43e 176our $mimetypes_file = undef;
2d007374 177
00f429af
MK
178# assume this charset if line contains non-UTF-8 characters;
179# it should be valid encoding (see Encoding::Supported(3pm) for list),
180# for which encoding all byte sequences are valid, for example
181# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
182# could be even 'utf-8' for the old behavior)
183our $fallback_encoding = 'latin1';
184
69a9b41c
JN
185# rename detection options for git-diff and git-diff-tree
186# - default is '-M', with the cost proportional to
187# (number of removed files) * (number of new files).
188# - more costly is '-C' (which implies '-M'), with the cost proportional to
189# (number of changed files + number of removed files) * (number of new files)
190# - even more costly is '-C', '--find-copies-harder' with cost
191# (number of files in the original tree) * (number of new files)
192# - one might want to include '-B' option, e.g. '-B', '-M'
193our @diff_opts = ('-M'); # taken from git_commit
194
7e1100e9
MM
195# Disables features that would allow repository owners to inject script into
196# the gitweb domain.
197our $prevent_xss = 0;
198
7ce896b3
CW
199# Path to the highlight executable to use (must be the one from
200# http://www.andre-simon.de due to assumptions about parameters and output).
201# Useful if highlight is not installed on your webserver's PATH.
202# [Default: highlight]
203our $highlight_bin = "++HIGHLIGHT_BIN++";
204
a3c8ab30
MM
205# information about snapshot formats that gitweb is capable of serving
206our %known_snapshot_formats = (
207 # name => {
208 # 'display' => display name,
209 # 'type' => mime type,
210 # 'suffix' => filename suffix,
211 # 'format' => --format for git-archive,
212 # 'compressor' => [compressor command and arguments]
1bfd3631
MR
213 # (array reference, optional)
214 # 'disabled' => boolean (optional)}
a3c8ab30
MM
215 #
216 'tgz' => {
217 'display' => 'tar.gz',
218 'type' => 'application/x-gzip',
219 'suffix' => '.tar.gz',
220 'format' => 'tar',
0c8c385e 221 'compressor' => ['gzip', '-n']},
a3c8ab30
MM
222
223 'tbz2' => {
224 'display' => 'tar.bz2',
225 'type' => 'application/x-bzip2',
226 'suffix' => '.tar.bz2',
227 'format' => 'tar',
228 'compressor' => ['bzip2']},
229
cbdefb5a
MR
230 'txz' => {
231 'display' => 'tar.xz',
232 'type' => 'application/x-xz',
233 'suffix' => '.tar.xz',
234 'format' => 'tar',
235 'compressor' => ['xz'],
236 'disabled' => 1},
237
a3c8ab30
MM
238 'zip' => {
239 'display' => 'zip',
240 'type' => 'application/x-zip',
241 'suffix' => '.zip',
242 'format' => 'zip'},
243);
244
245# Aliases so we understand old gitweb.snapshot values in repository
246# configuration.
247our %known_snapshot_format_aliases = (
248 'gzip' => 'tgz',
249 'bzip2' => 'tbz2',
cbdefb5a 250 'xz' => 'txz',
a3c8ab30
MM
251
252 # backward compatibility: legacy gitweb config support
253 'x-gzip' => undef, 'gz' => undef,
254 'x-bzip2' => undef, 'bz2' => undef,
255 'x-zip' => undef, '' => undef,
256);
257
e9fdd74e
GB
258# Pixel sizes for icons and avatars. If the default font sizes or lineheights
259# are changed, it may be appropriate to change these values too via
260# $GITWEB_CONFIG.
261our %avatar_size = (
262 'default' => 16,
263 'double' => 32
264);
265
b62a1a98
JWH
266# Used to set the maximum load that we will still respond to gitweb queries.
267# If server load exceed this value then return "503 server busy" error.
268# If gitweb cannot determined server load, it is taken to be 0.
269# Leave it undefined (or set to 'undef') to turn off load checking.
270our $maxload = 300;
271
61bf126e
AS
272# configuration for 'highlight' (http://www.andre-simon.de/)
273# match by basename
274our %highlight_basename = (
275 #'Program' => 'py',
276 #'Library' => 'py',
277 'SConstruct' => 'py', # SCons equivalent of Makefile
278 'Makefile' => 'make',
279);
280# match by extension
281our %highlight_ext = (
282 # main extensions, defining name of syntax;
283 # see files in /usr/share/highlight/langDefs/ directory
048b3991 284 (map { $_ => $_ } qw(py rb java css js tex bib xml awk bat ini spec tcl sql)),
61bf126e 285 # alternate extensions, see /etc/highlight/filetypes.conf
048b3991
RH
286 (map { $_ => 'c' } qw(c h)),
287 (map { $_ => 'sh' } qw(sh bash zsh ksh)),
288 (map { $_ => 'cpp' } qw(cpp cxx c++ cc)),
289 (map { $_ => 'php' } qw(php php3 php4 php5 phps)),
290 (map { $_ => 'pl' } qw(pl perl pm)), # perhaps also 'cgi'
291 (map { $_ => 'make'} qw(make mak mk)),
292 (map { $_ => 'xml' } qw(xml xhtml html htm)),
61bf126e
AS
293);
294
ddb8d900
AK
295# You define site-wide feature defaults here; override them with
296# $GITWEB_CONFIG as necessary.
952c65fc 297our %feature = (
17848fc6
JN
298 # feature => {
299 # 'sub' => feature-sub (subroutine),
300 # 'override' => allow-override (boolean),
301 # 'default' => [ default options...] (array reference)}
302 #
b4b20b21 303 # if feature is overridable (it means that allow-override has true value),
17848fc6
JN
304 # then feature-sub will be called with default options as parameters;
305 # return value of feature-sub indicates if to enable specified feature
306 #
b4b20b21 307 # if there is no 'sub' key (no feature-sub), then feature cannot be
22e5e58a 308 # overridden
b4b20b21 309 #
ff3c0ff2
GB
310 # use gitweb_get_feature(<feature>) to retrieve the <feature> value
311 # (an array) or gitweb_check_feature(<feature>) to check if <feature>
312 # is enabled
952c65fc 313
45a3b12c
PB
314 # Enable the 'blame' blob view, showing the last commit that modified
315 # each line in the file. This can be very CPU-intensive.
316
317 # To enable system wide have in $GITWEB_CONFIG
318 # $feature{'blame'}{'default'} = [1];
319 # To have project specific config enable override in $GITWEB_CONFIG
320 # $feature{'blame'}{'override'} = 1;
321 # and in project config gitweb.blame = 0|1;
952c65fc 322 'blame' => {
cdad8170 323 'sub' => sub { feature_bool('blame', @_) },
952c65fc
JN
324 'override' => 0,
325 'default' => [0]},
326
a3c8ab30 327 # Enable the 'snapshot' link, providing a compressed archive of any
45a3b12c
PB
328 # tree. This can potentially generate high traffic if you have large
329 # project.
330
a3c8ab30
MM
331 # Value is a list of formats defined in %known_snapshot_formats that
332 # you wish to offer.
45a3b12c 333 # To disable system wide have in $GITWEB_CONFIG
a3c8ab30 334 # $feature{'snapshot'}{'default'} = [];
45a3b12c 335 # To have project specific config enable override in $GITWEB_CONFIG
bbee1d97 336 # $feature{'snapshot'}{'override'} = 1;
a3c8ab30
MM
337 # and in project config, a comma-separated list of formats or "none"
338 # to disable. Example: gitweb.snapshot = tbz2,zip;
952c65fc
JN
339 'snapshot' => {
340 'sub' => \&feature_snapshot,
341 'override' => 0,
a3c8ab30 342 'default' => ['tgz']},
04f7a94f 343
6be93511
RF
344 # Enable text search, which will list the commits which match author,
345 # committer or commit text to a given string. Enabled by default.
b4b20b21 346 # Project specific override is not supported.
e0ca3645
JN
347 #
348 # Note that this controls all search features, which means that if
349 # it is disabled, then 'grep' and 'pickaxe' search would also be
350 # disabled.
6be93511
RF
351 'search' => {
352 'override' => 0,
353 'default' => [1]},
354
e7738553
PB
355 # Enable grep search, which will list the files in currently selected
356 # tree containing the given string. Enabled by default. This can be
357 # potentially CPU-intensive, of course.
a598ded1 358 # Note that you need to have 'search' feature enabled too.
e7738553
PB
359
360 # To enable system wide have in $GITWEB_CONFIG
361 # $feature{'grep'}{'default'} = [1];
362 # To have project specific config enable override in $GITWEB_CONFIG
363 # $feature{'grep'}{'override'} = 1;
364 # and in project config gitweb.grep = 0|1;
365 'grep' => {
cdad8170 366 'sub' => sub { feature_bool('grep', @_) },
e7738553
PB
367 'override' => 0,
368 'default' => [1]},
369
45a3b12c
PB
370 # Enable the pickaxe search, which will list the commits that modified
371 # a given string in a file. This can be practical and quite faster
372 # alternative to 'blame', but still potentially CPU-intensive.
a598ded1 373 # Note that you need to have 'search' feature enabled too.
45a3b12c
PB
374
375 # To enable system wide have in $GITWEB_CONFIG
376 # $feature{'pickaxe'}{'default'} = [1];
377 # To have project specific config enable override in $GITWEB_CONFIG
378 # $feature{'pickaxe'}{'override'} = 1;
379 # and in project config gitweb.pickaxe = 0|1;
04f7a94f 380 'pickaxe' => {
cdad8170 381 'sub' => sub { feature_bool('pickaxe', @_) },
04f7a94f
JN
382 'override' => 0,
383 'default' => [1]},
9e756904 384
e4b48eaa
JN
385 # Enable showing size of blobs in a 'tree' view, in a separate
386 # column, similar to what 'ls -l' does. This cost a bit of IO.
387
388 # To disable system wide have in $GITWEB_CONFIG
389 # $feature{'show-sizes'}{'default'} = [0];
390 # To have project specific config enable override in $GITWEB_CONFIG
391 # $feature{'show-sizes'}{'override'} = 1;
392 # and in project config gitweb.showsizes = 0|1;
393 'show-sizes' => {
394 'sub' => sub { feature_bool('showsizes', @_) },
395 'override' => 0,
396 'default' => [1]},
397
45a3b12c
PB
398 # Make gitweb use an alternative format of the URLs which can be
399 # more readable and natural-looking: project name is embedded
400 # directly in the path and the query string contains other
401 # auxiliary information. All gitweb installations recognize
402 # URL in either format; this configures in which formats gitweb
403 # generates links.
404
405 # To enable system wide have in $GITWEB_CONFIG
406 # $feature{'pathinfo'}{'default'} = [1];
407 # Project specific override is not supported.
408
409 # Note that you will need to change the default location of CSS,
410 # favicon, logo and possibly other files to an absolute URL. Also,
411 # if gitweb.cgi serves as your indexfile, you will need to force
412 # $my_uri to contain the script name in your $GITWEB_CONFIG.
9e756904
MW
413 'pathinfo' => {
414 'override' => 0,
415 'default' => [0]},
e30496df
PB
416
417 # Make gitweb consider projects in project root subdirectories
418 # to be forks of existing projects. Given project $projname.git,
419 # projects matching $projname/*.git will not be shown in the main
420 # projects list, instead a '+' mark will be added to $projname
421 # there and a 'forks' view will be enabled for the project, listing
c2b8b134
FL
422 # all the forks. If project list is taken from a file, forks have
423 # to be listed after the main project.
e30496df
PB
424
425 # To enable system wide have in $GITWEB_CONFIG
426 # $feature{'forks'}{'default'} = [1];
427 # Project specific override is not supported.
428 'forks' => {
429 'override' => 0,
430 'default' => [0]},
d627f68f
PB
431
432 # Insert custom links to the action bar of all project pages.
433 # This enables you mainly to link to third-party scripts integrating
434 # into gitweb; e.g. git-browser for graphical history representation
435 # or custom web-based repository administration interface.
436
437 # The 'default' value consists of a list of triplets in the form
438 # (label, link, position) where position is the label after which
2b11e059 439 # to insert the link and link is a format string where %n expands
d627f68f
PB
440 # to the project name, %f to the project path within the filesystem,
441 # %h to the current hash (h gitweb parameter) and %b to the current
2b11e059 442 # hash base (hb gitweb parameter); %% expands to %.
d627f68f
PB
443
444 # To enable system wide have in $GITWEB_CONFIG e.g.
445 # $feature{'actions'}{'default'} = [('graphiclog',
446 # '/git-browser/by-commit.html?r=%n', 'summary')];
447 # Project specific override is not supported.
448 'actions' => {
449 'override' => 0,
450 'default' => []},
3e3d4ee7 451
0368c492
JN
452 # Allow gitweb scan project content tags of project repository,
453 # and display the popular Web 2.0-ish "tag cloud" near the projects
454 # list. Note that this is something COMPLETELY different from the
455 # normal Git tags.
aed93de4
PB
456
457 # gitweb by itself can show existing tags, but it does not handle
0368c492
JN
458 # tagging itself; you need to do it externally, outside gitweb.
459 # The format is described in git_get_project_ctags() subroutine.
aed93de4
PB
460 # You may want to install the HTML::TagCloud Perl module to get
461 # a pretty tag cloud instead of just a list of tags.
462
463 # To enable system wide have in $GITWEB_CONFIG
0368c492 464 # $feature{'ctags'}{'default'} = [1];
aed93de4 465 # Project specific override is not supported.
0368c492
JN
466
467 # In the future whether ctags editing is enabled might depend
468 # on the value, but using 1 should always mean no editing of ctags.
aed93de4
PB
469 'ctags' => {
470 'override' => 0,
471 'default' => [0]},
9872cd6f
GB
472
473 # The maximum number of patches in a patchset generated in patch
474 # view. Set this to 0 or undef to disable patch view, or to a
475 # negative number to remove any limit.
476
477 # To disable system wide have in $GITWEB_CONFIG
478 # $feature{'patches'}{'default'} = [0];
479 # To have project specific config enable override in $GITWEB_CONFIG
480 # $feature{'patches'}{'override'} = 1;
481 # and in project config gitweb.patches = 0|n;
482 # where n is the maximum number of patches allowed in a patchset.
483 'patches' => {
484 'sub' => \&feature_patches,
485 'override' => 0,
486 'default' => [16]},
e9fdd74e
GB
487
488 # Avatar support. When this feature is enabled, views such as
489 # shortlog or commit will display an avatar associated with
490 # the email of the committer(s) and/or author(s).
491
679a1a1d
GB
492 # Currently available providers are gravatar and picon.
493 # If an unknown provider is specified, the feature is disabled.
494
679a1a1d 495 # Picon currently relies on the indiana.edu database.
e9fdd74e
GB
496
497 # To enable system wide have in $GITWEB_CONFIG
679a1a1d
GB
498 # $feature{'avatar'}{'default'} = ['<provider>'];
499 # where <provider> is either gravatar or picon.
e9fdd74e
GB
500 # To have project specific config enable override in $GITWEB_CONFIG
501 # $feature{'avatar'}{'override'} = 1;
679a1a1d 502 # and in project config gitweb.avatar = <provider>;
e9fdd74e
GB
503 'avatar' => {
504 'sub' => \&feature_avatar,
505 'override' => 0,
506 'default' => ['']},
aa7dd05e
JN
507
508 # Enable displaying how much time and how many git commands
509 # it took to generate and display page. Disabled by default.
510 # Project specific override is not supported.
511 'timed' => {
512 'override' => 0,
513 'default' => [0]},
e627e50a
JN
514
515 # Enable turning some links into links to actions which require
516 # JavaScript to run (like 'blame_incremental'). Not enabled by
517 # default. Project specific override is currently not supported.
518 'javascript-actions' => {
519 'override' => 0,
520 'default' => [0]},
b331fe54 521
2e987f92
JN
522 # Enable and configure ability to change common timezone for dates
523 # in gitweb output via JavaScript. Enabled by default.
524 # Project specific override is not supported.
525 'javascript-timezone' => {
526 'override' => 0,
527 'default' => [
528 'local', # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
529 # or undef to turn off this feature
530 'gitweb_tz', # name of cookie where to store selected timezone
531 'datetime', # CSS class used to mark up dates for manipulation
532 ]},
533
b331fe54
JS
534 # Syntax highlighting support. This is based on Daniel Svensson's
535 # and Sham Chukoury's work in gitweb-xmms2.git.
592ea417
JN
536 # It requires the 'highlight' program present in $PATH,
537 # and therefore is disabled by default.
b331fe54
JS
538
539 # To enable system wide have in $GITWEB_CONFIG
540 # $feature{'highlight'}{'default'} = [1];
541
542 'highlight' => {
543 'sub' => sub { feature_bool('highlight', @_) },
544 'override' => 0,
545 'default' => [0]},
60efa245
GB
546
547 # Enable displaying of remote heads in the heads list
548
549 # To enable system wide have in $GITWEB_CONFIG
550 # $feature{'remote_heads'}{'default'} = [1];
551 # To have project specific config enable override in $GITWEB_CONFIG
552 # $feature{'remote_heads'}{'override'} = 1;
af507944 553 # and in project config gitweb.remoteheads = 0|1;
60efa245
GB
554 'remote_heads' => {
555 'sub' => sub { feature_bool('remote_heads', @_) },
556 'override' => 0,
557 'default' => [0]},
8d646a9b
KN
558
559 # Enable showing branches under other refs in addition to heads
560
561 # To set system wide extra branch refs have in $GITWEB_CONFIG
562 # $feature{'extra-branch-refs'}{'default'} = ['dirs', 'of', 'choice'];
563 # To have project specific config enable override in $GITWEB_CONFIG
564 # $feature{'extra-branch-refs'}{'override'} = 1;
565 # and in project config gitweb.extrabranchrefs = dirs of choice
566 # Every directory is separated with whitespace.
567
568 'extra-branch-refs' => {
569 'sub' => \&feature_extra_branch_refs,
570 'override' => 0,
571 'default' => []},
ddb8d900
AK
572);
573
a7c5a283 574sub gitweb_get_feature {
ddb8d900 575 my ($name) = @_;
dd1ad5f1 576 return unless exists $feature{$name};
952c65fc
JN
577 my ($sub, $override, @defaults) = (
578 $feature{$name}{'sub'},
579 $feature{$name}{'override'},
580 @{$feature{$name}{'default'}});
9be3614e
JN
581 # project specific override is possible only if we have project
582 our $git_dir; # global variable, declared later
583 if (!$override || !defined $git_dir) {
584 return @defaults;
585 }
a9455919 586 if (!defined $sub) {
93197898 587 warn "feature $name is not overridable";
a9455919
MW
588 return @defaults;
589 }
ddb8d900
AK
590 return $sub->(@defaults);
591}
592
25b2790f
GB
593# A wrapper to check if a given feature is enabled.
594# With this, you can say
595#
596# my $bool_feat = gitweb_check_feature('bool_feat');
597# gitweb_check_feature('bool_feat') or somecode;
598#
599# instead of
600#
601# my ($bool_feat) = gitweb_get_feature('bool_feat');
602# (gitweb_get_feature('bool_feat'))[0] or somecode;
603#
604sub gitweb_check_feature {
605 return (gitweb_get_feature(@_))[0];
606}
607
608
cdad8170
MK
609sub feature_bool {
610 my $key = shift;
611 my ($val) = git_get_project_config($key, '--bool');
ddb8d900 612
df5d10a3
MC
613 if (!defined $val) {
614 return ($_[0]);
615 } elsif ($val eq 'true') {
cdad8170 616 return (1);
ddb8d900 617 } elsif ($val eq 'false') {
cdad8170 618 return (0);
ddb8d900 619 }
ddb8d900
AK
620}
621
ddb8d900 622sub feature_snapshot {
a3c8ab30 623 my (@fmts) = @_;
ddb8d900
AK
624
625 my ($val) = git_get_project_config('snapshot');
626
a3c8ab30
MM
627 if ($val) {
628 @fmts = ($val eq 'none' ? () : split /\s*[,\s]\s*/, $val);
ddb8d900
AK
629 }
630
a3c8ab30 631 return @fmts;
de9272f4
LT
632}
633
9872cd6f
GB
634sub feature_patches {
635 my @val = (git_get_project_config('patches', '--int'));
636
637 if (@val) {
638 return @val;
639 }
640
641 return ($_[0]);
642}
643
e9fdd74e
GB
644sub feature_avatar {
645 my @val = (git_get_project_config('avatar'));
646
647 return @val ? @val : @_;
648}
649
8d646a9b
KN
650sub feature_extra_branch_refs {
651 my (@branch_refs) = @_;
652 my $values = git_get_project_config('extrabranchrefs');
653
654 if ($values) {
655 $values = config_to_multi ($values);
656 @branch_refs = ();
657 foreach my $value (@{$values}) {
658 push @branch_refs, split /\s+/, $value;
659 }
660 }
661
662 return @branch_refs;
663}
664
2172ce4b
JH
665# checking HEAD file with -e is fragile if the repository was
666# initialized long time ago (i.e. symlink HEAD) and was pack-ref'ed
667# and then pruned.
668sub check_head_link {
669 my ($dir) = @_;
670 my $headfile = "$dir/HEAD";
671 return ((-e $headfile) ||
672 (-l $headfile && readlink($headfile) =~ /^refs\/heads\//));
673}
674
675sub check_export_ok {
676 my ($dir) = @_;
677 return (check_head_link($dir) &&
dd7f5f10
AG
678 (!$export_ok || -e "$dir/$export_ok") &&
679 (!$export_auth_hook || $export_auth_hook->($dir)));
2172ce4b
JH
680}
681
a781785d
JN
682# process alternate names for backward compatibility
683# filter out unsupported (unknown) snapshot formats
684sub filter_snapshot_fmts {
685 my @fmts = @_;
686
687 @fmts = map {
688 exists $known_snapshot_format_aliases{$_} ?
689 $known_snapshot_format_aliases{$_} : $_} @fmts;
68cedb1f 690 @fmts = grep {
1bfd3631
MR
691 exists $known_snapshot_formats{$_} &&
692 !$known_snapshot_formats{$_}{'disabled'}} @fmts;
a781785d
JN
693}
694
8d646a9b
KN
695sub filter_and_validate_refs {
696 my @refs = @_;
697 my %unique_refs = ();
698
699 foreach my $ref (@refs) {
700 die_error(500, "Invalid ref '$ref' in 'extra-branch-refs' feature") unless (is_valid_ref_format($ref));
701 # 'heads' are added implicitly in get_branch_refs().
702 $unique_refs{$ref} = 1 if ($ref ne 'heads');
703 }
704 return sort keys %unique_refs;
705}
706
da4b2432
JN
707# If it is set to code reference, it is code that it is to be run once per
708# request, allowing updating configurations that change with each request,
709# while running other code in config file only once.
710#
711# Otherwise, if it is false then gitweb would process config file only once;
712# if it is true then gitweb config would be run for each request.
713our $per_request_config = 1;
714
f612a71c
JN
715# read and parse gitweb config file given by its parameter.
716# returns true on success, false on recoverable error, allowing
717# to chain this subroutine, using first file that exists.
718# dies on errors during parsing config file, as it is unrecoverable.
719sub read_config_file {
720 my $filename = shift;
721 return unless defined $filename;
722 # die if there are errors parsing config file
723 if (-e $filename) {
724 do $filename;
725 die $@ if $@;
726 return 1;
727 }
728 return;
729}
730
131d6afc 731our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);
c2394fe9
JN
732sub evaluate_gitweb_config {
733 our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
734 our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
131d6afc 735 our $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";
f612a71c 736
41ccfdd9 737 # Protect against duplications of file names, to not read config twice.
131d6afc
JN
738 # Only one of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM is used, so
739 # there possibility of duplication of filename there doesn't matter.
740 $GITWEB_CONFIG = "" if ($GITWEB_CONFIG eq $GITWEB_CONFIG_COMMON);
741 $GITWEB_CONFIG_SYSTEM = "" if ($GITWEB_CONFIG_SYSTEM eq $GITWEB_CONFIG_COMMON);
742
743 # Common system-wide settings for convenience.
744 # Those settings can be ovverriden by GITWEB_CONFIG or GITWEB_CONFIG_SYSTEM.
745 read_config_file($GITWEB_CONFIG_COMMON);
746
747 # Use first config file that exists. This means use the per-instance
748 # GITWEB_CONFIG if exists, otherwise use GITWEB_SYSTEM_CONFIG.
749 read_config_file($GITWEB_CONFIG) and return;
f612a71c 750 read_config_file($GITWEB_CONFIG_SYSTEM);
17a8b250 751}
c8d138a8 752
b62a1a98
JWH
753# Get loadavg of system, to compare against $maxload.
754# Currently it requires '/proc/loadavg' present to get loadavg;
755# if it is not present it returns 0, which means no load checking.
756sub get_loadavg {
757 if( -e '/proc/loadavg' ){
758 open my $fd, '<', '/proc/loadavg'
759 or return 0;
760 my @load = split(/\s+/, scalar <$fd>);
761 close $fd;
762
763 # The first three columns measure CPU and IO utilization of the last one,
764 # five, and 10 minute periods. The fourth column shows the number of
765 # currently running processes and the total number of processes in the m/n
766 # format. The last column displays the last process ID used.
767 return $load[0] || 0;
768 }
769 # additional checks for load average should go here for things that don't export
770 # /proc/loadavg
771
772 return 0;
773}
774
c8d138a8 775# version of the core git binary
c2394fe9
JN
776our $git_version;
777sub evaluate_git_version {
778 our $git_version = qx("$GIT" --version) =~ m/git version (.*)$/ ? $1 : "unknown";
779 $number_of_git_cmds++;
780}
c8d138a8 781
c2394fe9
JN
782sub check_loadavg {
783 if (defined $maxload && get_loadavg() > $maxload) {
784 die_error(503, "The load average on the server is too high");
785 }
b62a1a98
JWH
786}
787
154b4d78 788# ======================================================================
09bd7898 789# input validation and dispatch
1b2d297e 790
cfb04911 791# Various hash size-related values.
792my $sha1_len = 40;
793my $sha256_extra_len = 24;
794my $sha256_len = $sha1_len + $sha256_extra_len;
795
796# A regex matching $len hex characters. $len may be a range (e.g. 7,64).
797sub oid_nlen_regex {
798 my $len = shift;
799 my $hchr = qr/[0-9a-fA-F]/;
800 return qr/(?:(?:$hchr){$len})/;
801}
802
803# A regex matching two sets of $nlen hex characters, prefixed by the literal
804# string $prefix and with the literal string $infix between them.
805sub oid_nlen_prefix_infix_regex {
806 my $nlen = shift;
807 my $prefix = shift;
808 my $infix = shift;
809
810 my $rx = oid_nlen_regex($nlen);
811
812 return qr/^\Q$prefix\E$rx\Q$infix\E$rx$/;
813}
814
815# A regex matching a valid object ID.
816our $oid_regex;
817{
818 my $x = oid_nlen_regex($sha1_len);
819 my $y = oid_nlen_regex($sha256_extra_len);
820 $oid_regex = qr/(?:$x(?:$y)?)/;
821}
822
1b2d297e
GB
823# input parameters can be collected from a variety of sources (presently, CGI
824# and PATH_INFO), so we define an %input_params hash that collects them all
825# together during validation: this allows subsequent uses (e.g. href()) to be
826# agnostic of the parameter origin
827
dde80d9c 828our %input_params = ();
1b2d297e
GB
829
830# input parameters are stored with the long parameter name as key. This will
831# also be used in the href subroutine to convert parameters to their CGI
832# equivalent, and since the href() usage is the most frequent one, we store
833# the name -> CGI key mapping here, instead of the reverse.
834#
835# XXX: Warning: If you touch this, check the search form for updating,
836# too.
837
dde80d9c 838our @cgi_param_mapping = (
1b2d297e
GB
839 project => "p",
840 action => "a",
841 file_name => "f",
842 file_parent => "fp",
843 hash => "h",
844 hash_parent => "hp",
845 hash_base => "hb",
846 hash_parent_base => "hpb",
847 page => "pg",
848 order => "o",
849 searchtext => "s",
850 searchtype => "st",
851 snapshot_format => "sf",
852 extra_options => "opt",
853 search_use_regexp => "sr",
0368c492 854 ctag => "by_tag",
6ba1eb51 855 diff_style => "ds",
19d2d239 856 project_filter => "pf",
c4ccf61f
JN
857 # this must be last entry (for manipulation from JavaScript)
858 javascript => "js"
1b2d297e 859);
dde80d9c 860our %cgi_param_mapping = @cgi_param_mapping;
1b2d297e
GB
861
862# we will also need to know the possible actions, for validation
dde80d9c 863our %actions = (
1b2d297e 864 "blame" => \&git_blame,
4af819d4
JN
865 "blame_incremental" => \&git_blame_incremental,
866 "blame_data" => \&git_blame_data,
1b2d297e
GB
867 "blobdiff" => \&git_blobdiff,
868 "blobdiff_plain" => \&git_blobdiff_plain,
869 "blob" => \&git_blob,
870 "blob_plain" => \&git_blob_plain,
871 "commitdiff" => \&git_commitdiff,
872 "commitdiff_plain" => \&git_commitdiff_plain,
873 "commit" => \&git_commit,
874 "forks" => \&git_forks,
875 "heads" => \&git_heads,
876 "history" => \&git_history,
877 "log" => \&git_log,
9872cd6f 878 "patch" => \&git_patch,
a3411f8a 879 "patches" => \&git_patches,
00fa6fef 880 "remotes" => \&git_remotes,
1b2d297e
GB
881 "rss" => \&git_rss,
882 "atom" => \&git_atom,
883 "search" => \&git_search,
884 "search_help" => \&git_search_help,
885 "shortlog" => \&git_shortlog,
886 "summary" => \&git_summary,
887 "tag" => \&git_tag,
888 "tags" => \&git_tags,
889 "tree" => \&git_tree,
890 "snapshot" => \&git_snapshot,
891 "object" => \&git_object,
892 # those below don't need $project
893 "opml" => \&git_opml,
894 "project_list" => \&git_project_list,
895 "project_index" => \&git_project_index,
896);
897
898# finally, we have the hash of allowed extra_options for the commands that
899# allow them
dde80d9c 900our %allowed_options = (
1b2d297e
GB
901 "--no-merges" => [ qw(rss atom log shortlog history) ],
902);
903
904# fill %input_params with the CGI parameters. All values except for 'opt'
905# should be single values, but opt can be an array. We should probably
906# build an array of parameters that can be multi-valued, but since for the time
907# being it's only this one, we just single it out
c2394fe9
JN
908sub evaluate_query_params {
909 our $cgi;
910
911 while (my ($name, $symbol) = each %cgi_param_mapping) {
912 if ($symbol eq 'opt') {
13dbf46a 913 $input_params{$name} = [ map { decode_utf8($_) } $cgi->multi_param($symbol) ];
c2394fe9 914 } else {
84d9e2d5 915 $input_params{$name} = decode_utf8($cgi->param($symbol));
c2394fe9 916 }
1b2d297e
GB
917 }
918}
919
920# now read PATH_INFO and update the parameter list for missing parameters
921sub evaluate_path_info {
922 return if defined $input_params{'project'};
923 return if !$path_info;
924 $path_info =~ s,^/+,,;
925 return if !$path_info;
926
927 # find which part of PATH_INFO is project
928 my $project = $path_info;
929 $project =~ s,/+$,,;
930 while ($project && !check_head_link("$projectroot/$project")) {
931 $project =~ s,/*[^/]*$,,;
932 }
933 return unless $project;
934 $input_params{'project'} = $project;
935
936 # do not change any parameters if an action is given using the query string
937 return if $input_params{'action'};
938 $path_info =~ s,^\Q$project\E/*,,;
939
d8c28822
GB
940 # next, check if we have an action
941 my $action = $path_info;
942 $action =~ s,/.*$,,;
943 if (exists $actions{$action}) {
944 $path_info =~ s,^$action/*,,;
945 $input_params{'action'} = $action;
946 }
947
948 # list of actions that want hash_base instead of hash, but can have no
949 # pathname (f) parameter
950 my @wants_base = (
951 'tree',
952 'history',
953 );
954
7e00dc58 955 # we want to catch, among others
b0be3838
GB
956 # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
957 my ($parentrefname, $parentpathname, $refname, $pathname) =
7e00dc58 958 ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);
b0be3838
GB
959
960 # first, analyze the 'current' part
1b2d297e 961 if (defined $pathname) {
d8c28822
GB
962 # we got "branch:filename" or "branch:dir/"
963 # we could use git_get_type(branch:pathname), but:
964 # - it needs $git_dir
965 # - it does a git() call
966 # - the convention of terminating directories with a slash
967 # makes it superfluous
968 # - embedding the action in the PATH_INFO would make it even
969 # more superfluous
1b2d297e
GB
970 $pathname =~ s,^/+,,;
971 if (!$pathname || substr($pathname, -1) eq "/") {
d8c28822 972 $input_params{'action'} ||= "tree";
1b2d297e
GB
973 $pathname =~ s,/$,,;
974 } else {
b0be3838
GB
975 # the default action depends on whether we had parent info
976 # or not
977 if ($parentrefname) {
978 $input_params{'action'} ||= "blobdiff_plain";
979 } else {
980 $input_params{'action'} ||= "blob_plain";
981 }
1b2d297e
GB
982 }
983 $input_params{'hash_base'} ||= $refname;
984 $input_params{'file_name'} ||= $pathname;
985 } elsif (defined $refname) {
d8c28822
GB
986 # we got "branch". In this case we have to choose if we have to
987 # set hash or hash_base.
988 #
989 # Most of the actions without a pathname only want hash to be
990 # set, except for the ones specified in @wants_base that want
991 # hash_base instead. It should also be noted that hand-crafted
992 # links having 'history' as an action and no pathname or hash
993 # set will fail, but that happens regardless of PATH_INFO.
d0af3734
JN
994 if (defined $parentrefname) {
995 # if there is parent let the default be 'shortlog' action
996 # (for http://git.example.com/repo.git/A..B links); if there
997 # is no parent, dispatch will detect type of object and set
998 # action appropriately if required (if action is not set)
999 $input_params{'action'} ||= "shortlog";
1000 }
1001 if ($input_params{'action'} &&
1002 grep { $_ eq $input_params{'action'} } @wants_base) {
d8c28822
GB
1003 $input_params{'hash_base'} ||= $refname;
1004 } else {
1005 $input_params{'hash'} ||= $refname;
1006 }
1b2d297e 1007 }
b0be3838
GB
1008
1009 # next, handle the 'parent' part, if present
1010 if (defined $parentrefname) {
1011 # a missing pathspec defaults to the 'current' filename, allowing e.g.
1012 # someproject/blobdiff/oldrev..newrev:/filename
1013 if ($parentpathname) {
1014 $parentpathname =~ s,^/+,,;
1015 $parentpathname =~ s,/$,,;
1016 $input_params{'file_parent'} ||= $parentpathname;
1017 } else {
1018 $input_params{'file_parent'} ||= $input_params{'file_name'};
1019 }
1020 # we assume that hash_parent_base is wanted if a path was specified,
1021 # or if the action wants hash_base instead of hash
1022 if (defined $input_params{'file_parent'} ||
1023 grep { $_ eq $input_params{'action'} } @wants_base) {
1024 $input_params{'hash_parent_base'} ||= $parentrefname;
1025 } else {
1026 $input_params{'hash_parent'} ||= $parentrefname;
1027 }
1028 }
1ec2fb5f
GB
1029
1030 # for the snapshot action, we allow URLs in the form
1031 # $project/snapshot/$hash.ext
1032 # where .ext determines the snapshot and gets removed from the
1033 # passed $refname to provide the $hash.
1034 #
1035 # To be able to tell that $refname includes the format extension, we
1036 # require the following two conditions to be satisfied:
1037 # - the hash input parameter MUST have been set from the $refname part
1038 # of the URL (i.e. they must be equal)
1039 # - the snapshot format MUST NOT have been defined already (e.g. from
1040 # CGI parameter sf)
1041 # It's also useless to try any matching unless $refname has a dot,
1042 # so we check for that too
1043 if (defined $input_params{'action'} &&
1044 $input_params{'action'} eq 'snapshot' &&
1045 defined $refname && index($refname, '.') != -1 &&
1046 $refname eq $input_params{'hash'} &&
1047 !defined $input_params{'snapshot_format'}) {
1048 # We loop over the known snapshot formats, checking for
1049 # extensions. Allowed extensions are both the defined suffix
1050 # (which includes the initial dot already) and the snapshot
1051 # format key itself, with a prepended dot
ccb4b539 1052 while (my ($fmt, $opt) = each %known_snapshot_formats) {
1ec2fb5f 1053 my $hash = $refname;
095e9142
JN
1054 unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
1055 next;
1056 }
1057 my $sfx = $1;
1ec2fb5f
GB
1058 # a valid suffix was found, so set the snapshot format
1059 # and reset the hash parameter
1060 $input_params{'snapshot_format'} = $fmt;
1061 $input_params{'hash'} = $hash;
1062 # we also set the format suffix to the one requested
1063 # in the URL: this way a request for e.g. .tgz returns
1064 # a .tgz instead of a .tar.gz
1065 $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
1066 last;
1067 }
1068 }
1b2d297e 1069}
1b2d297e 1070
c2394fe9
JN
1071our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
1072 $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
19d2d239 1073 $searchtext, $search_regexp, $project_filter);
c2394fe9
JN
1074sub evaluate_and_validate_params {
1075 our $action = $input_params{'action'};
1076 if (defined $action) {
23faf546 1077 if (!is_valid_action($action)) {
c2394fe9
JN
1078 die_error(400, "Invalid action parameter");
1079 }
b87d78d6 1080 }
44ad2978 1081
c2394fe9
JN
1082 # parameters which are pathnames
1083 our $project = $input_params{'project'};
1084 if (defined $project) {
23faf546 1085 if (!is_valid_project($project)) {
c2394fe9
JN
1086 undef $project;
1087 die_error(404, "No such project");
1088 }
9cd3d988 1089 }
6191f8e1 1090
19d2d239
BL
1091 our $project_filter = $input_params{'project_filter'};
1092 if (defined $project_filter) {
23faf546 1093 if (!is_valid_pathname($project_filter)) {
19d2d239
BL
1094 die_error(404, "Invalid project_filter parameter");
1095 }
1096 }
1097
c2394fe9
JN
1098 our $file_name = $input_params{'file_name'};
1099 if (defined $file_name) {
23faf546 1100 if (!is_valid_pathname($file_name)) {
c2394fe9
JN
1101 die_error(400, "Invalid file parameter");
1102 }
24d0693a 1103 }
24d0693a 1104
c2394fe9
JN
1105 our $file_parent = $input_params{'file_parent'};
1106 if (defined $file_parent) {
23faf546 1107 if (!is_valid_pathname($file_parent)) {
c2394fe9
JN
1108 die_error(400, "Invalid file parent parameter");
1109 }
24d0693a 1110 }
5c95fab0 1111
c2394fe9
JN
1112 # parameters which are refnames
1113 our $hash = $input_params{'hash'};
1114 if (defined $hash) {
23faf546 1115 if (!is_valid_refname($hash)) {
c2394fe9
JN
1116 die_error(400, "Invalid hash parameter");
1117 }
4fac5294 1118 }
6191f8e1 1119
c2394fe9
JN
1120 our $hash_parent = $input_params{'hash_parent'};
1121 if (defined $hash_parent) {
23faf546 1122 if (!is_valid_refname($hash_parent)) {
c2394fe9
JN
1123 die_error(400, "Invalid hash parent parameter");
1124 }
c91da262 1125 }
09bd7898 1126
c2394fe9
JN
1127 our $hash_base = $input_params{'hash_base'};
1128 if (defined $hash_base) {
23faf546 1129 if (!is_valid_refname($hash_base)) {
c2394fe9
JN
1130 die_error(400, "Invalid hash base parameter");
1131 }
c91da262 1132 }
6191f8e1 1133
c2394fe9
JN
1134 our @extra_options = @{$input_params{'extra_options'}};
1135 # @extra_options is always defined, since it can only be (currently) set from
1136 # CGI, and $cgi->param() returns the empty array in array context if the param
1137 # is not set
1138 foreach my $opt (@extra_options) {
1139 if (not exists $allowed_options{$opt}) {
1140 die_error(400, "Invalid option parameter");
1141 }
1142 if (not grep(/^$action$/, @{$allowed_options{$opt}})) {
1143 die_error(400, "Invalid option parameter for this action");
1144 }
868bc068 1145 }
868bc068 1146
c2394fe9
JN
1147 our $hash_parent_base = $input_params{'hash_parent_base'};
1148 if (defined $hash_parent_base) {
23faf546 1149 if (!is_valid_refname($hash_parent_base)) {
c2394fe9
JN
1150 die_error(400, "Invalid hash parent base parameter");
1151 }
420e92f2 1152 }
420e92f2 1153
c2394fe9
JN
1154 # other parameters
1155 our $page = $input_params{'page'};
1156 if (defined $page) {
1157 if ($page =~ m/[^0-9]/) {
1158 die_error(400, "Invalid page parameter");
1159 }
b87d78d6 1160 }
823d5dc8 1161
c2394fe9
JN
1162 our $searchtype = $input_params{'searchtype'};
1163 if (defined $searchtype) {
1164 if ($searchtype =~ m/[^a-z]/) {
1165 die_error(400, "Invalid searchtype parameter");
1166 }
e7738553 1167 }
e7738553 1168
c2394fe9 1169 our $search_use_regexp = $input_params{'search_use_regexp'};
0e559919 1170
c2394fe9 1171 our $searchtext = $input_params{'searchtext'};
ca7a5dcf 1172 our $search_regexp = undef;
c2394fe9
JN
1173 if (defined $searchtext) {
1174 if (length($searchtext) < 2) {
1175 die_error(403, "At least two characters are required for search parameter");
1176 }
36612e4d
JN
1177 if ($search_use_regexp) {
1178 $search_regexp = $searchtext;
1179 if (!eval { qr/$search_regexp/; 1; }) {
1180 (my $error = $@) =~ s/ at \S+ line \d+.*\n?//;
1181 die_error(400, "Invalid search regexp '$search_regexp'",
1182 esc_html($error));
1183 }
1184 } else {
1185 $search_regexp = quotemeta $searchtext;
1186 }
9d032c72 1187 }
19806691
KS
1188}
1189
645927ce
ML
1190# path to the current git repository
1191our $git_dir;
c2394fe9
JN
1192sub evaluate_git_dir {
1193 our $git_dir = "$projectroot/$project" if $project;
e9fdd74e
GB
1194}
1195
8d646a9b 1196our (@snapshot_fmts, $git_avatar, @extra_branch_refs);
c2394fe9
JN
1197sub configure_gitweb_features {
1198 # list of supported snapshot formats
1199 our @snapshot_fmts = gitweb_get_feature('snapshot');
1200 @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);
1201
c2394fe9 1202 our ($git_avatar) = gitweb_get_feature('avatar');
7d5b30e0 1203 $git_avatar = '' unless $git_avatar =~ /^(?:gravatar|picon)$/s;
8d646a9b
KN
1204
1205 our @extra_branch_refs = gitweb_get_feature('extra-branch-refs');
1206 @extra_branch_refs = filter_and_validate_refs (@extra_branch_refs);
1207}
1208
1209sub get_branch_refs {
1210 return ('heads', @extra_branch_refs);
e9fdd74e
GB
1211}
1212
7a597457
JN
1213# custom error handler: 'die <message>' is Internal Server Error
1214sub handle_errors_html {
1215 my $msg = shift; # it is already HTML escaped
1216
1217 # to avoid infinite loop where error occurs in die_error,
1218 # change handler to default handler, disabling handle_errors_html
41ccfdd9 1219 set_message("Error occurred when inside die_error:\n$msg");
7a597457
JN
1220
1221 # you cannot jump out of die_error when called as error handler;
1222 # the subroutine set via CGI::Carp::set_message is called _after_
1223 # HTTP headers are already written, so it cannot write them itself
1224 die_error(undef, undef, $msg, -error_handler => 1, -no_http_header => 1);
1225}
1226set_message(\&handle_errors_html);
1227
717b8311 1228# dispatch
c2394fe9
JN
1229sub dispatch {
1230 if (!defined $action) {
1231 if (defined $hash) {
1232 $action = git_get_type($hash);
18ab83e8 1233 $action or die_error(404, "Object does not exist");
c2394fe9
JN
1234 } elsif (defined $hash_base && defined $file_name) {
1235 $action = git_get_type("$hash_base:$file_name");
18ab83e8 1236 $action or die_error(404, "File or directory does not exist");
c2394fe9
JN
1237 } elsif (defined $project) {
1238 $action = 'summary';
1239 } else {
1240 $action = 'project_list';
1241 }
7f9778b1 1242 }
c2394fe9
JN
1243 if (!defined($actions{$action})) {
1244 die_error(400, "Unknown action");
1245 }
1246 if ($action !~ m/^(?:opml|project_list|project_index)$/ &&
1247 !$project) {
1248 die_error(400, "Project needed");
1249 }
1250 $actions{$action}->();
77a153fd 1251}
c2394fe9 1252
869d5881 1253sub reset_timer {
3962f1d7 1254 our $t0 = [ gettimeofday() ]
c2394fe9 1255 if defined $t0;
869d5881
JN
1256 our $number_of_git_cmds = 0;
1257}
1258
da4b2432 1259our $first_request = 1;
869d5881
JN
1260sub run_request {
1261 reset_timer();
c2394fe9
JN
1262
1263 evaluate_uri();
da4b2432
JN
1264 if ($first_request) {
1265 evaluate_gitweb_config();
1266 evaluate_git_version();
1267 }
1268 if ($per_request_config) {
1269 if (ref($per_request_config) eq 'CODE') {
1270 $per_request_config->();
1271 } elsif (!$first_request) {
1272 evaluate_gitweb_config();
1273 }
1274 }
c2394fe9
JN
1275 check_loadavg();
1276
7f425db9
JN
1277 # $projectroot and $projects_list might be set in gitweb config file
1278 $projects_list ||= $projectroot;
1279
c2394fe9
JN
1280 evaluate_query_params();
1281 evaluate_path_info();
1282 evaluate_and_validate_params();
1283 evaluate_git_dir();
1284
1285 configure_gitweb_features();
1286
1287 dispatch();
09bd7898 1288}
a0446e7b
SV
1289
1290our $is_last_request = sub { 1 };
1291our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
1292our $CGI = 'CGI';
1293our $cgi;
45aa9895
JN
1294sub configure_as_fcgi {
1295 require CGI::Fast;
1296 our $CGI = 'CGI::Fast';
1297
1298 my $request_number = 0;
1299 # let each child service 100 requests
1300 our $is_last_request = sub { ++$request_number > 100 };
d04d3d42 1301}
a0446e7b 1302sub evaluate_argv {
45aa9895
JN
1303 my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
1304 configure_as_fcgi()
1305 if $script_name =~ /\.fcgi$/;
1306
a0446e7b
SV
1307 return unless (@ARGV);
1308
1309 require Getopt::Long;
1310 Getopt::Long::GetOptions(
45aa9895 1311 'fastcgi|fcgi|f' => \&configure_as_fcgi,
a0446e7b
SV
1312 'nproc|n=i' => sub {
1313 my ($arg, $val) = @_;
1314 return unless eval { require FCGI::ProcManager; 1; };
1315 my $proc_manager = FCGI::ProcManager->new({
1316 n_processes => $val,
1317 });
1318 our $pre_listen_hook = sub { $proc_manager->pm_manage() };
1319 our $pre_dispatch_hook = sub { $proc_manager->pm_pre_dispatch() };
1320 our $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
1321 },
1322 );
1323}
1324
1325sub run {
1326 evaluate_argv();
869d5881 1327
da4b2432 1328 $first_request = 1;
a0446e7b
SV
1329 $pre_listen_hook->()
1330 if $pre_listen_hook;
1331
1332 REQUEST:
1333 while ($cgi = $CGI->new()) {
1334 $pre_dispatch_hook->()
1335 if $pre_dispatch_hook;
1336
1337 run_request();
1338
0b45010e 1339 $post_dispatch_hook->()
a0446e7b 1340 if $post_dispatch_hook;
da4b2432 1341 $first_request = 0;
a0446e7b
SV
1342
1343 last REQUEST if ($is_last_request->());
1344 }
c2394fe9
JN
1345
1346 DONE_GITWEB:
1347 1;
d04d3d42 1348}
a0446e7b 1349
c2394fe9 1350run();
09bd7898 1351
5ed2ec10
JN
1352if (defined caller) {
1353 # wrapped in a subroutine processing requests,
1354 # e.g. mod_perl with ModPerl::Registry, or PSGI with Plack::App::WrapCGI
1355 return;
1356} else {
1357 # pure CGI script, serving single request
1358 exit;
1359}
09bd7898 1360
06a9d86b
MW
1361## ======================================================================
1362## action links
1363
377bee34
JN
1364# possible values of extra options
1365# -full => 0|1 - use absolute/full URL ($my_uri/$my_url as base)
1366# -replay => 1 - start from a current view (replay with modifications)
1367# -path_info => 0|1 - don't use/use path_info URL (if possible)
5e96a847 1368# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
74fd8728 1369sub href {
498fe002 1370 my %params = @_;
bd5d1e42
JN
1371 # default is to use -absolute url() i.e. $my_uri
1372 my $href = $params{-full} ? $my_url : $my_uri;
498fe002 1373
5e96a847
KC
1374 # implicit -replay, must be first of implicit params
1375 $params{-replay} = 1 if (keys %params == 1 && $params{-anchor});
1376
afa9b620
JN
1377 $params{'project'} = $project unless exists $params{'project'};
1378
1cad283a 1379 if ($params{-replay}) {
1b2d297e 1380 while (my ($name, $symbol) = each %cgi_param_mapping) {
1cad283a 1381 if (!exists $params{$name}) {
1b2d297e 1382 $params{$name} = $input_params{$name};
1cad283a
JN
1383 }
1384 }
1385 }
1386
25b2790f 1387 my $use_pathinfo = gitweb_check_feature('pathinfo');
377bee34
JN
1388 if (defined $params{'project'} &&
1389 (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
b02bd7a6
GB
1390 # try to put as many parameters as possible in PATH_INFO:
1391 # - project name
1392 # - action
8db49a7f 1393 # - hash_parent or hash_parent_base:/file_parent
3550ea71 1394 # - hash or hash_base:/filename
c752a0e0 1395 # - the snapshot_format as an appropriate suffix
b02bd7a6
GB
1396
1397 # When the script is the root DirectoryIndex for the domain,
1398 # $href here would be something like http://gitweb.example.com/
1399 # Thus, we strip any trailing / from $href, to spare us double
1400 # slashes in the final URL
1401 $href =~ s,/$,,;
1402
1403 # Then add the project name, if present
67976c65 1404 $href .= "/".esc_path_info($params{'project'});
9e756904
MW
1405 delete $params{'project'};
1406
c752a0e0
GB
1407 # since we destructively absorb parameters, we keep this
1408 # boolean that remembers if we're handling a snapshot
1409 my $is_snapshot = $params{'action'} eq 'snapshot';
1410
b02bd7a6
GB
1411 # Summary just uses the project path URL, any other action is
1412 # added to the URL
1413 if (defined $params{'action'}) {
67976c65
JN
1414 $href .= "/".esc_path_info($params{'action'})
1415 unless $params{'action'} eq 'summary';
9e756904
MW
1416 delete $params{'action'};
1417 }
b02bd7a6 1418
8db49a7f
GB
1419 # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
1420 # stripping nonexistent or useless pieces
1421 $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
1422 || $params{'hash_parent'} || $params{'hash'});
b02bd7a6 1423 if (defined $params{'hash_base'}) {
8db49a7f 1424 if (defined $params{'hash_parent_base'}) {
67976c65 1425 $href .= esc_path_info($params{'hash_parent_base'});
8db49a7f 1426 # skip the file_parent if it's the same as the file_name
b7da721f
GB
1427 if (defined $params{'file_parent'}) {
1428 if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
1429 delete $params{'file_parent'};
1430 } elsif ($params{'file_parent'} !~ /\.\./) {
67976c65 1431 $href .= ":/".esc_path_info($params{'file_parent'});
b7da721f
GB
1432 delete $params{'file_parent'};
1433 }
8db49a7f
GB
1434 }
1435 $href .= "..";
1436 delete $params{'hash_parent'};
1437 delete $params{'hash_parent_base'};
1438 } elsif (defined $params{'hash_parent'}) {
67976c65 1439 $href .= esc_path_info($params{'hash_parent'}). "..";
8db49a7f
GB
1440 delete $params{'hash_parent'};
1441 }
1442
67976c65 1443 $href .= esc_path_info($params{'hash_base'});
8db49a7f 1444 if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
67976c65 1445 $href .= ":/".esc_path_info($params{'file_name'});
b02bd7a6
GB
1446 delete $params{'file_name'};
1447 }
1448 delete $params{'hash'};
1449 delete $params{'hash_base'};
1450 } elsif (defined $params{'hash'}) {
67976c65 1451 $href .= esc_path_info($params{'hash'});
b02bd7a6
GB
1452 delete $params{'hash'};
1453 }
c752a0e0
GB
1454
1455 # If the action was a snapshot, we can absorb the
1456 # snapshot_format parameter too
1457 if ($is_snapshot) {
1458 my $fmt = $params{'snapshot_format'};
1459 # snapshot_format should always be defined when href()
1460 # is called, but just in case some code forgets, we
1461 # fall back to the default
1462 $fmt ||= $snapshot_fmts[0];
1463 $href .= $known_snapshot_formats{$fmt}{'suffix'};
1464 delete $params{'snapshot_format'};
1465 }
9e756904
MW
1466 }
1467
1468 # now encode the parameters explicitly
498fe002 1469 my @result = ();
1b2d297e
GB
1470 for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
1471 my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
498fe002 1472 if (defined $params{$name}) {
f22cca44
JN
1473 if (ref($params{$name}) eq "ARRAY") {
1474 foreach my $par (@{$params{$name}}) {
1475 push @result, $symbol . "=" . esc_param($par);
1476 }
1477 } else {
1478 push @result, $symbol . "=" . esc_param($params{$name});
1479 }
498fe002
JN
1480 }
1481 }
9e756904
MW
1482 $href .= "?" . join(';', @result) if scalar @result;
1483
67976c65
JN
1484 # final transformation: trailing spaces must be escaped (URI-encoded)
1485 $href =~ s/(\s+)$/CGI::escape($1)/e;
1486
5e96a847
KC
1487 if ($params{-anchor}) {
1488 $href .= "#".esc_param($params{-anchor});
1489 }
1490
9e756904 1491 return $href;
06a9d86b
MW
1492}
1493
1494
717b8311
JN
1495## ======================================================================
1496## validation, quoting/unquoting and escaping
1497
23faf546
KN
1498sub is_valid_action {
1499 my $input = shift;
1b2d297e 1500 return undef unless exists $actions{$input};
23faf546 1501 return 1;
1b2d297e
GB
1502}
1503
23faf546
KN
1504sub is_valid_project {
1505 my $input = shift;
1506
1507 return unless defined $input;
1508 if (!is_valid_pathname($input) ||
1b2d297e 1509 !(-d "$projectroot/$input") ||
ec26f098 1510 !check_export_ok("$projectroot/$input") ||
1b2d297e
GB
1511 ($strict_export && !project_in_list($input))) {
1512 return undef;
1513 } else {
23faf546 1514 return 1;
1b2d297e
GB
1515 }
1516}
1517
23faf546
KN
1518sub is_valid_pathname {
1519 my $input = shift;
717b8311 1520
23faf546 1521 return undef unless defined $input;
01689909 1522 # no '.' or '..' as elements of path, i.e. no '.' or '..'
24d0693a
JN
1523 # at the beginning, at the end, and between slashes.
1524 # also this catches doubled slashes
1525 if ($input =~ m!(^|/)(|\.|\.\.)(/|$)!) {
1526 return undef;
717b8311 1527 }
24d0693a
JN
1528 # no null characters
1529 if ($input =~ m!\0!) {
717b8311
JN
1530 return undef;
1531 }
23faf546 1532 return 1;
24d0693a
JN
1533}
1534
c0bc2265 1535sub is_valid_ref_format {
23faf546 1536 my $input = shift;
c0bc2265 1537
23faf546 1538 return undef unless defined $input;
c0bc2265
KN
1539 # restrictions on ref name according to git-check-ref-format
1540 if ($input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!) {
1541 return undef;
1542 }
23faf546 1543 return 1;
c0bc2265
KN
1544}
1545
23faf546
KN
1546sub is_valid_refname {
1547 my $input = shift;
24d0693a 1548
23faf546 1549 return undef unless defined $input;
24d0693a 1550 # textual hashes are O.K.
cfb04911 1551 if ($input =~ m/^$oid_regex$/) {
23faf546 1552 return 1;
24d0693a
JN
1553 }
1554 # it must be correct pathname
23faf546 1555 is_valid_pathname($input) or return undef;
c0bc2265 1556 # check git-check-ref-format restrictions
23faf546
KN
1557 is_valid_ref_format($input) or return undef;
1558 return 1;
717b8311
JN
1559}
1560
00f429af
MK
1561# decode sequences of octets in utf8 into Perl's internal form,
1562# which is utf-8 with utf8 flag set if needed. gitweb writes out
1563# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
1564sub to_utf8 {
1565 my $str = shift;
1df48766 1566 return undef unless defined $str;
b13e3eac
JN
1567
1568 if (utf8::is_utf8($str) || utf8::decode($str)) {
e5d3de5c 1569 return $str;
00f429af
MK
1570 } else {
1571 return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
1572 }
1573}
1574
232ff553
KS
1575# quote unsafe chars, but keep the slash, even when it's not
1576# correct, but quoted slashes look too horrible in bookmarks
1577sub esc_param {
353347b0 1578 my $str = shift;
1df48766 1579 return undef unless defined $str;
452e2256 1580 $str =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
a9e60b7d 1581 $str =~ s/ /\+/g;
353347b0
KS
1582 return $str;
1583}
1584
67976c65
JN
1585# the quoting rules for path_info fragment are slightly different
1586sub esc_path_info {
1587 my $str = shift;
1588 return undef unless defined $str;
1589
1590 # path_info doesn't treat '+' as space (specially), but '?' must be escaped
1591 $str =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;
1592
1593 return $str;
1594}
1595
22e5e58a 1596# quote unsafe chars in whole URL, so some characters cannot be quoted
f93bff8d
JN
1597sub esc_url {
1598 my $str = shift;
1df48766 1599 return undef unless defined $str;
109988f2 1600 $str =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
f93bff8d
JN
1601 $str =~ s/ /\+/g;
1602 return $str;
1603}
1604
3017ed62
JN
1605# quote unsafe characters in HTML attributes
1606sub esc_attr {
1607
1608 # for XHTML conformance escaping '"' to '&quot;' is not enough
1609 return esc_html(@_);
1610}
1611
232ff553 1612# replace invalid utf8 character with SUBSTITUTION sequence
74fd8728 1613sub esc_html {
40c13813 1614 my $str = shift;
6255ef08
JN
1615 my %opts = @_;
1616
1df48766
JN
1617 return undef unless defined $str;
1618
00f429af 1619 $str = to_utf8($str);
c390ae97 1620 $str = $cgi->escapeHTML($str);
6255ef08
JN
1621 if ($opts{'-nbsp'}) {
1622 $str =~ s/ /&nbsp;/g;
1623 }
25ffbb27 1624 $str =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;
40c13813
KS
1625 return $str;
1626}
1627
391862e3
JN
1628# quote control characters and escape filename to HTML
1629sub esc_path {
1630 my $str = shift;
1631 my %opts = @_;
1632
1df48766
JN
1633 return undef unless defined $str;
1634
00f429af 1635 $str = to_utf8($str);
c390ae97 1636 $str = $cgi->escapeHTML($str);
391862e3
JN
1637 if ($opts{'-nbsp'}) {
1638 $str =~ s/ /&nbsp;/g;
1639 }
1640 $str =~ s|([[:cntrl:]])|quot_cec($1)|eg;
1641 return $str;
1642}
1643
26547bfb 1644# Sanitize for use in XHTML + application/xml+xhtml (valid XML 1.0)
0866786b
JN
1645sub sanitize {
1646 my $str = shift;
1647
1648 return undef unless defined $str;
1649
1650 $str = to_utf8($str);
0e901d24 1651 $str =~ s|([[:cntrl:]])|(index("\t\n\r", $1) != -1 ? $1 : quot_cec($1))|eg;
0866786b
JN
1652 return $str;
1653}
1654
391862e3 1655# Make control characters "printable", using character escape codes (CEC)
1d3bc0cc
JN
1656sub quot_cec {
1657 my $cntrl = shift;
c84c483f 1658 my %opts = @_;
1d3bc0cc 1659 my %es = ( # character escape codes, aka escape sequences
c84c483f
JN
1660 "\t" => '\t', # tab (HT)
1661 "\n" => '\n', # line feed (LF)
1662 "\r" => '\r', # carrige return (CR)
1663 "\f" => '\f', # form feed (FF)
1664 "\b" => '\b', # backspace (BS)
1665 "\a" => '\a', # alarm (bell) (BEL)
1666 "\e" => '\e', # escape (ESC)
1667 "\013" => '\v', # vertical tab (VT)
1668 "\000" => '\0', # nul character (NUL)
1669 );
1d3bc0cc
JN
1670 my $chr = ( (exists $es{$cntrl})
1671 ? $es{$cntrl}
25dfd171 1672 : sprintf('\%2x', ord($cntrl)) );
c84c483f
JN
1673 if ($opts{-nohtml}) {
1674 return $chr;
1675 } else {
1676 return "<span class=\"cntrl\">$chr</span>";
1677 }
1d3bc0cc
JN
1678}
1679
391862e3
JN
1680# Alternatively use unicode control pictures codepoints,
1681# Unicode "printable representation" (PR)
1d3bc0cc
JN
1682sub quot_upr {
1683 my $cntrl = shift;
c84c483f
JN
1684 my %opts = @_;
1685
1d3bc0cc 1686 my $chr = sprintf('&#%04d;', 0x2400+ord($cntrl));
c84c483f
JN
1687 if ($opts{-nohtml}) {
1688 return $chr;
1689 } else {
1690 return "<span class=\"cntrl\">$chr</span>";
1691 }
1d3bc0cc
JN
1692}
1693
232ff553
KS
1694# git may return quoted and escaped filenames
1695sub unquote {
1696 my $str = shift;
403d0906
JN
1697
1698 sub unq {
1699 my $seq = shift;
1700 my %es = ( # character escape codes, aka escape sequences
1701 't' => "\t", # tab (HT, TAB)
1702 'n' => "\n", # newline (NL)
1703 'r' => "\r", # return (CR)
1704 'f' => "\f", # form feed (FF)
1705 'b' => "\b", # backspace (BS)
1706 'a' => "\a", # alarm (bell) (BEL)
1707 'e' => "\e", # escape (ESC)
1708 'v' => "\013", # vertical tab (VT)
1709 );
1710
1711 if ($seq =~ m/^[0-7]{1,3}$/) {
1712 # octal char sequence
1713 return chr(oct($seq));
1714 } elsif (exists $es{$seq}) {
1715 # C escape sequence, aka character escape code
c84c483f 1716 return $es{$seq};
403d0906
JN
1717 }
1718 # quoted ordinary character
1719 return $seq;
1720 }
1721
232ff553 1722 if ($str =~ m/^"(.*)"$/) {
403d0906 1723 # needs unquoting
232ff553 1724 $str = $1;
403d0906 1725 $str =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
232ff553
KS
1726 }
1727 return $str;
1728}
1729
f16db173
JN
1730# escape tabs (convert tabs to spaces)
1731sub untabify {
1732 my $line = shift;
1733
1734 while ((my $pos = index($line, "\t")) != -1) {
1735 if (my $count = (8 - ($pos % 8))) {
1736 my $spaces = ' ' x $count;
1737 $line =~ s/\t/$spaces/;
1738 }
1739 }
1740
1741 return $line;
1742}
1743
32f4aacc
ML
1744sub project_in_list {
1745 my $project = shift;
1746 my @list = git_get_projects_list();
1747 return @list && scalar(grep { $_->{'path'} eq $project } @list);
1748}
1749
717b8311
JN
1750## ----------------------------------------------------------------------
1751## HTML aware string manipulation
1752
b8d97d07
JN
1753# Try to chop given string on a word boundary between position
1754# $len and $len+$add_len. If there is no word boundary there,
1755# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
1756# (marking chopped part) would be longer than given string.
717b8311
JN
1757sub chop_str {
1758 my $str = shift;
1759 my $len = shift;
1760 my $add_len = shift || 10;
b8d97d07 1761 my $where = shift || 'right'; # 'left' | 'center' | 'right'
717b8311 1762
dee2775a
AW
1763 # Make sure perl knows it is utf8 encoded so we don't
1764 # cut in the middle of a utf8 multibyte char.
1765 $str = to_utf8($str);
1766
717b8311
JN
1767 # allow only $len chars, but don't cut a word if it would fit in $add_len
1768 # if it doesn't fit, cut it if it's still longer than the dots we would add
b8d97d07
JN
1769 # remove chopped character entities entirely
1770
1771 # when chopping in the middle, distribute $len into left and right part
1772 # return early if chopping wouldn't make string shorter
1773 if ($where eq 'center') {
1774 return $str if ($len + 5 >= length($str)); # filler is length 5
1775 $len = int($len/2);
1776 } else {
1777 return $str if ($len + 4 >= length($str)); # filler is length 4
1778 }
1779
1780 # regexps: ending and beginning with word part up to $add_len
1781 my $endre = qr/.{$len}\w{0,$add_len}/;
1782 my $begre = qr/\w{0,$add_len}.{$len}/;
1783
1784 if ($where eq 'left') {
1785 $str =~ m/^(.*?)($begre)$/;
1786 my ($lead, $body) = ($1, $2);
1787 if (length($lead) > 4) {
b8d97d07
JN
1788 $lead = " ...";
1789 }
1790 return "$lead$body";
1791
1792 } elsif ($where eq 'center') {
1793 $str =~ m/^($endre)(.*)$/;
1794 my ($left, $str) = ($1, $2);
1795 $str =~ m/^(.*?)($begre)$/;
1796 my ($mid, $right) = ($1, $2);
1797 if (length($mid) > 5) {
b8d97d07
JN
1798 $mid = " ... ";
1799 }
1800 return "$left$mid$right";
1801
1802 } else {
1803 $str =~ m/^($endre)(.*)$/;
1804 my $body = $1;
1805 my $tail = $2;
1806 if (length($tail) > 4) {
b8d97d07
JN
1807 $tail = "... ";
1808 }
1809 return "$body$tail";
717b8311 1810 }
717b8311
JN
1811}
1812
ce58ec91
DS
1813# takes the same arguments as chop_str, but also wraps a <span> around the
1814# result with a title attribute if it does get chopped. Additionally, the
1815# string is HTML-escaped.
1816sub chop_and_escape_str {
b8d97d07 1817 my ($str) = @_;
ce58ec91 1818
b8d97d07 1819 my $chopped = chop_str(@_);
168c1e01 1820 $str = to_utf8($str);
ce58ec91
DS
1821 if ($chopped eq $str) {
1822 return esc_html($chopped);
1823 } else {
14afe774 1824 $str =~ s/[[:cntrl:]]/?/g;
850b90a5 1825 return $cgi->span({-title=>$str}, esc_html($chopped));
ce58ec91
DS
1826 }
1827}
1828
337da8d2
JN
1829# Highlight selected fragments of string, using given CSS class,
1830# and escape HTML. It is assumed that fragments do not overlap.
1831# Regions are passed as list of pairs (array references).
1832#
1833# Example: esc_html_hl_regions("foobar", "mark", [ 0, 3 ]) returns
1834# '<span class="mark">foo</span>bar'
1835sub esc_html_hl_regions {
1836 my ($str, $css_class, @sel) = @_;
9768a9d8
JN
1837 my %opts = grep { ref($_) ne 'ARRAY' } @sel;
1838 @sel = grep { ref($_) eq 'ARRAY' } @sel;
1839 return esc_html($str, %opts) unless @sel;
337da8d2
JN
1840
1841 my $out = '';
1842 my $pos = 0;
1843
1844 for my $s (@sel) {
ce61fb96 1845 my ($begin, $end) = @$s;
337da8d2 1846
cbbea3df
MK
1847 # Don't create empty <span> elements.
1848 next if $end <= $begin;
1849
9768a9d8
JN
1850 my $escaped = esc_html(substr($str, $begin, $end - $begin),
1851 %opts);
ce61fb96 1852
9768a9d8 1853 $out .= esc_html(substr($str, $pos, $begin - $pos), %opts)
ce61fb96
MK
1854 if ($begin - $pos > 0);
1855 $out .= $cgi->span({-class => $css_class}, $escaped);
1856
1857 $pos = $end;
337da8d2 1858 }
9768a9d8 1859 $out .= esc_html(substr($str, $pos), %opts)
337da8d2
JN
1860 if ($pos < length($str));
1861
1862 return $out;
1863}
1864
e607b79f
JN
1865# return positions of beginning and end of each match
1866sub matchpos_list {
337da8d2 1867 my ($str, $regexp) = @_;
e607b79f 1868 return unless (defined $str && defined $regexp);
337da8d2
JN
1869
1870 my @matches;
1871 while ($str =~ /$regexp/g) {
1872 push @matches, [$-[0], $+[0]];
1873 }
e607b79f
JN
1874 return @matches;
1875}
1876
1877# highlight match (if any), and escape HTML
1878sub esc_html_match_hl {
1879 my ($str, $regexp) = @_;
1880 return esc_html($str) unless defined $regexp;
1881
1882 my @matches = matchpos_list($str, $regexp);
337da8d2
JN
1883 return esc_html($str) unless @matches;
1884
1885 return esc_html_hl_regions($str, 'match', @matches);
1886}
1887
e607b79f
JN
1888
1889# highlight match (if any) of shortened string, and escape HTML
1890sub esc_html_match_hl_chopped {
1891 my ($str, $chopped, $regexp) = @_;
1892 return esc_html_match_hl($str, $regexp) unless defined $chopped;
1893
1894 my @matches = matchpos_list($str, $regexp);
1895 return esc_html($chopped) unless @matches;
1896
1897 # filter matches so that we mark chopped string
1898 my $tail = "... "; # see chop_str
1899 unless ($chopped =~ s/\Q$tail\E$//) {
1900 $tail = '';
1901 }
1902 my $chop_len = length($chopped);
1903 my $tail_len = length($tail);
1904 my @filtered;
1905
1906 for my $m (@matches) {
1907 if ($m->[0] > $chop_len) {
1908 push @filtered, [ $chop_len, $chop_len + $tail_len ] if ($tail_len > 0);
1909 last;
1910 } elsif ($m->[1] > $chop_len) {
1911 push @filtered, [ $m->[0], $chop_len + $tail_len ];
1912 last;
1913 }
1914 push @filtered, $m;
1915 }
1916
1917 return esc_html_hl_regions($chopped . $tail, 'match', @filtered);
1918}
1919
717b8311
JN
1920## ----------------------------------------------------------------------
1921## functions returning short strings
1922
1f1ab5f0
JN
1923# CSS class for given age value (in seconds)
1924sub age_class {
1925 my $age = shift;
1926
785cdea9
JN
1927 if (!defined $age) {
1928 return "noage";
1929 } elsif ($age < 60*60*2) {
1f1ab5f0
JN
1930 return "age0";
1931 } elsif ($age < 60*60*24*2) {
1932 return "age1";
1933 } else {
1934 return "age2";
1935 }
1936}
1937
717b8311
JN
1938# convert age in seconds to "nn units ago" string
1939sub age_string {
1940 my $age = shift;
1941 my $age_str;
a59d4afd 1942
717b8311
JN
1943 if ($age > 60*60*24*365*2) {
1944 $age_str = (int $age/60/60/24/365);
1945 $age_str .= " years ago";
1946 } elsif ($age > 60*60*24*(365/12)*2) {
1947 $age_str = int $age/60/60/24/(365/12);
1948 $age_str .= " months ago";
1949 } elsif ($age > 60*60*24*7*2) {
1950 $age_str = int $age/60/60/24/7;
1951 $age_str .= " weeks ago";
1952 } elsif ($age > 60*60*24*2) {
1953 $age_str = int $age/60/60/24;
1954 $age_str .= " days ago";
1955 } elsif ($age > 60*60*2) {
1956 $age_str = int $age/60/60;
1957 $age_str .= " hours ago";
1958 } elsif ($age > 60*2) {
1959 $age_str = int $age/60;
1960 $age_str .= " min ago";
1961 } elsif ($age > 2) {
1962 $age_str = int $age;
1963 $age_str .= " sec ago";
f6801d66 1964 } else {
717b8311 1965 $age_str .= " right now";
4c02e3c5 1966 }
717b8311 1967 return $age_str;
161332a5
KS
1968}
1969
01ac1e38
JN
1970use constant {
1971 S_IFINVALID => 0030000,
1972 S_IFGITLINK => 0160000,
1973};
1974
1975# submodule/subproject, a commit object reference
74fd8728 1976sub S_ISGITLINK {
01ac1e38
JN
1977 my $mode = shift;
1978
1979 return (($mode & S_IFMT) == S_IFGITLINK)
1980}
1981
717b8311
JN
1982# convert file mode in octal to symbolic file mode string
1983sub mode_str {
1984 my $mode = oct shift;
1985
01ac1e38
JN
1986 if (S_ISGITLINK($mode)) {
1987 return 'm---------';
1988 } elsif (S_ISDIR($mode & S_IFMT)) {
717b8311
JN
1989 return 'drwxr-xr-x';
1990 } elsif (S_ISLNK($mode)) {
1991 return 'lrwxrwxrwx';
1992 } elsif (S_ISREG($mode)) {
1993 # git cares only about the executable bit
1994 if ($mode & S_IXUSR) {
1995 return '-rwxr-xr-x';
1996 } else {
1997 return '-rw-r--r--';
1998 };
c994d620 1999 } else {
717b8311 2000 return '----------';
ff7669a5 2001 }
161332a5
KS
2002}
2003
717b8311
JN
2004# convert file mode in octal to file type string
2005sub file_type {
7c5e2ebb
JN
2006 my $mode = shift;
2007
2008 if ($mode !~ m/^[0-7]+$/) {
2009 return $mode;
2010 } else {
2011 $mode = oct $mode;
2012 }
664f4cc5 2013
01ac1e38
JN
2014 if (S_ISGITLINK($mode)) {
2015 return "submodule";
2016 } elsif (S_ISDIR($mode & S_IFMT)) {
717b8311
JN
2017 return "directory";
2018 } elsif (S_ISLNK($mode)) {
2019 return "symlink";
2020 } elsif (S_ISREG($mode)) {
2021 return "file";
2022 } else {
2023 return "unknown";
2024 }
a59d4afd
KS
2025}
2026
744d0ac3
JN
2027# convert file mode in octal to file type description string
2028sub file_type_long {
2029 my $mode = shift;
2030
2031 if ($mode !~ m/^[0-7]+$/) {
2032 return $mode;
2033 } else {
2034 $mode = oct $mode;
2035 }
2036
01ac1e38
JN
2037 if (S_ISGITLINK($mode)) {
2038 return "submodule";
2039 } elsif (S_ISDIR($mode & S_IFMT)) {
744d0ac3
JN
2040 return "directory";
2041 } elsif (S_ISLNK($mode)) {
2042 return "symlink";
2043 } elsif (S_ISREG($mode)) {
2044 if ($mode & S_IXUSR) {
2045 return "executable";
2046 } else {
2047 return "file";
2048 };
2049 } else {
2050 return "unknown";
2051 }
2052}
2053
2054
717b8311
JN
2055## ----------------------------------------------------------------------
2056## functions returning short HTML fragments, or transforming HTML fragments
3dff5379 2057## which don't belong to other sections
b18f9bf4 2058
225932ed 2059# format line of commit message.
717b8311
JN
2060sub format_log_line_html {
2061 my $line = shift;
b18f9bf4 2062
cfb04911 2063 # Potentially abbreviated OID.
2064 my $regex = oid_nlen_regex("7,64");
2065
225932ed 2066 $line = esc_html($line, -nbsp=>1);
cf5c7253
ÆAB
2067 $line =~ s{
2068 \b
2069 (
2070 # The output of "git describe", e.g. v2.10.0-297-gf6727b0
2071 # or hadoop-20160921-113441-20-g094fb7d
2072 (?<!-) # see strbuf_check_tag_ref(). Tags can't start with -
2073 [A-Za-z0-9.-]+
2074 (?!\.) # refs can't end with ".", see check_refname_format()
cfb04911 2075 -g$regex
cf5c7253
ÆAB
2076 |
2077 # Just a normal looking Git SHA1
cfb04911 2078 $regex
cf5c7253
ÆAB
2079 )
2080 \b
2081 }{
7d233dea
MC
2082 $cgi->a({-href => href(action=>"object", hash=>$1),
2083 -class => "text"}, $1);
cf5c7253 2084 }egx;
7d233dea 2085
717b8311 2086 return $line;
b18f9bf4
JN
2087}
2088
717b8311 2089# format marker of refs pointing to given object
4afbaeff
GB
2090
2091# the destination action is chosen based on object type and current context:
2092# - for annotated tags, we choose the tag view unless it's the current view
2093# already, in which case we go to shortlog view
2094# - for other refs, we keep the current view if we're in history, shortlog or
2095# log view, and select shortlog otherwise
847e01fb 2096sub format_ref_marker {
717b8311 2097 my ($refs, $id) = @_;
d294e1ca 2098 my $markers = '';
27fb8c40 2099
717b8311 2100 if (defined $refs->{$id}) {
d294e1ca 2101 foreach my $ref (@{$refs->{$id}}) {
4afbaeff
GB
2102 # this code exploits the fact that non-lightweight tags are the
2103 # only indirect objects, and that they are the only objects for which
2104 # we want to use tag instead of shortlog as action
d294e1ca 2105 my ($type, $name) = qw();
4afbaeff 2106 my $indirect = ($ref =~ s/\^\{\}$//);
d294e1ca
JN
2107 # e.g. tags/v2.6.11 or heads/next
2108 if ($ref =~ m!^(.*?)s?/(.*)$!) {
2109 $type = $1;
2110 $name = $2;
2111 } else {
2112 $type = "ref";
2113 $name = $ref;
2114 }
2115
4afbaeff
GB
2116 my $class = $type;
2117 $class .= " indirect" if $indirect;
2118
2119 my $dest_action = "shortlog";
2120
2121 if ($indirect) {
2122 $dest_action = "tag" unless $action eq "tag";
2123 } elsif ($action =~ /^(history|(short)?log)$/) {
2124 $dest_action = $action;
2125 }
2126
2127 my $dest = "";
2128 $dest .= "refs/" unless $ref =~ m!^refs/!;
2129 $dest .= $ref;
2130
2131 my $link = $cgi->a({
2132 -href => href(
2133 action=>$dest_action,
2134 hash=>$dest
77947bbe 2135 )}, esc_html($name));
4afbaeff 2136
3017ed62 2137 $markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
4afbaeff 2138 $link . "</span>";
d294e1ca
JN
2139 }
2140 }
2141
2142 if ($markers) {
2143 return ' <span class="refs">'. $markers . '</span>';
717b8311
JN
2144 } else {
2145 return "";
2146 }
27fb8c40
JN
2147}
2148
17d07443
JN
2149# format, perhaps shortened and with markers, title line
2150sub format_subject_html {
1c2a4f5a 2151 my ($long, $short, $href, $extra) = @_;
17d07443
JN
2152 $extra = '' unless defined($extra);
2153
2154 if (length($short) < length($long)) {
14afe774 2155 $long =~ s/[[:cntrl:]]/?/g;
7c278014 2156 return $cgi->a({-href => $href, -class => "list subject",
00f429af 2157 -title => to_utf8($long)},
01b89f0c 2158 esc_html($short)) . $extra;
17d07443 2159 } else {
7c278014 2160 return $cgi->a({-href => $href, -class => "list subject"},
01b89f0c 2161 esc_html($long)) . $extra;
17d07443
JN
2162 }
2163}
2164
5a371b7b
GB
2165# Rather than recomputing the url for an email multiple times, we cache it
2166# after the first hit. This gives a visible benefit in views where the avatar
2167# for the same email is used repeatedly (e.g. shortlog).
2168# The cache is shared by all avatar engines (currently gravatar only), which
2169# are free to use it as preferred. Since only one avatar engine is used for any
2170# given page, there's no risk for cache conflicts.
2171our %avatar_cache = ();
2172
679a1a1d
GB
2173# Compute the picon url for a given email, by using the picon search service over at
2174# http://www.cs.indiana.edu/picons/search.html
2175sub picon_url {
2176 my $email = lc shift;
2177 if (!$avatar_cache{$email}) {
2178 my ($user, $domain) = split('@', $email);
2179 $avatar_cache{$email} =
57485581 2180 "//www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
679a1a1d
GB
2181 "$domain/$user/" .
2182 "users+domains+unknown/up/single";
2183 }
2184 return $avatar_cache{$email};
2185}
2186
5a371b7b
GB
2187# Compute the gravatar url for a given email, if it's not in the cache already.
2188# Gravatar stores only the part of the URL before the size, since that's the
2189# one computationally more expensive. This also allows reuse of the cache for
2190# different sizes (for this particular engine).
2191sub gravatar_url {
2192 my $email = lc shift;
2193 my $size = shift;
2194 $avatar_cache{$email} ||=
57485581 2195 "//www.gravatar.com/avatar/" .
7d5b30e0 2196 md5_hex($email) . "?s=";
5a371b7b
GB
2197 return $avatar_cache{$email} . $size;
2198}
2199
e9fdd74e
GB
2200# Insert an avatar for the given $email at the given $size if the feature
2201# is enabled.
2202sub git_get_avatar {
2203 my ($email, %opts) = @_;
2204 my $pre_white = ($opts{-pad_before} ? "&nbsp;" : "");
2205 my $post_white = ($opts{-pad_after} ? "&nbsp;" : "");
2206 $opts{-size} ||= 'default';
2207 my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};
2208 my $url = "";
2209 if ($git_avatar eq 'gravatar') {
5a371b7b 2210 $url = gravatar_url($email, $size);
679a1a1d
GB
2211 } elsif ($git_avatar eq 'picon') {
2212 $url = picon_url($email);
e9fdd74e 2213 }
679a1a1d 2214 # Other providers can be added by extending the if chain, defining $url
e9fdd74e
GB
2215 # as needed. If no variant puts something in $url, we assume avatars
2216 # are completely disabled/unavailable.
2217 if ($url) {
2218 return $pre_white .
2219 "<img width=\"$size\" " .
2220 "class=\"avatar\" " .
3017ed62 2221 "src=\"".esc_url($url)."\" " .
7d25ef41 2222 "alt=\"\" " .
e9fdd74e
GB
2223 "/>" . $post_white;
2224 } else {
2225 return "";
2226 }
2227}
2228
e133d65c
SB
2229sub format_search_author {
2230 my ($author, $searchtype, $displaytext) = @_;
2231 my $have_search = gitweb_check_feature('search');
2232
2233 if ($have_search) {
2234 my $performed = "";
2235 if ($searchtype eq 'author') {
2236 $performed = "authored";
2237 } elsif ($searchtype eq 'committer') {
2238 $performed = "committed";
2239 }
2240
2241 return $cgi->a({-href => href(action=>"search", hash=>$hash,
2242 searchtext=>$author,
2243 searchtype=>$searchtype), class=>"list",
2244 title=>"Search for commits $performed by $author"},
2245 $displaytext);
2246
2247 } else {
2248 return $displaytext;
2249 }
2250}
2251
1c49a4e1
GB
2252# format the author name of the given commit with the given tag
2253# the author name is chopped and escaped according to the other
2254# optional parameters (see chop_str).
2255sub format_author_html {
2256 my $tag = shift;
2257 my $co = shift;
2258 my $author = chop_and_escape_str($co->{'author_name'}, @_);
e9fdd74e 2259 return "<$tag class=\"author\">" .
e133d65c
SB
2260 format_search_author($co->{'author_name'}, "author",
2261 git_get_avatar($co->{'author_email'}, -pad_after => 1) .
2262 $author) .
2263 "</$tag>";
1c49a4e1
GB
2264}
2265
90921740
JN
2266# format git diff header line, i.e. "diff --(git|combined|cc) ..."
2267sub format_git_diff_header_line {
2268 my $line = shift;
2269 my $diffinfo = shift;
2270 my ($from, $to) = @_;
2271
2272 if ($diffinfo->{'nparents'}) {
2273 # combined diff
2274 $line =~ s!^(diff (.*?) )"?.*$!$1!;
2275 if ($to->{'href'}) {
2276 $line .= $cgi->a({-href => $to->{'href'}, -class => "path"},
2277 esc_path($to->{'file'}));
2278 } else { # file was deleted (no href)
2279 $line .= esc_path($to->{'file'});
2280 }
2281 } else {
2282 # "ordinary" diff
2283 $line =~ s!^(diff (.*?) )"?a/.*$!$1!;
2284 if ($from->{'href'}) {
2285 $line .= $cgi->a({-href => $from->{'href'}, -class => "path"},
2286 'a/' . esc_path($from->{'file'}));
2287 } else { # file was added (no href)
2288 $line .= 'a/' . esc_path($from->{'file'});
2289 }
2290 $line .= ' ';
2291 if ($to->{'href'}) {
2292 $line .= $cgi->a({-href => $to->{'href'}, -class => "path"},
2293 'b/' . esc_path($to->{'file'}));
2294 } else { # file was deleted
2295 $line .= 'b/' . esc_path($to->{'file'});
2296 }
2297 }
2298
2299 return "<div class=\"diff header\">$line</div>\n";
2300}
2301
2302# format extended diff header line, before patch itself
2303sub format_extended_diff_header_line {
2304 my $line = shift;
2305 my $diffinfo = shift;
2306 my ($from, $to) = @_;
2307
2308 # match <path>
2309 if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
2310 $line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
2311 esc_path($from->{'file'}));
2312 }
2313 if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
2314 $line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
2315 esc_path($to->{'file'}));
2316 }
2317 # match single <mode>
2318 if ($line =~ m/\s(\d{6})$/) {
2319 $line .= '<span class="info"> (' .
2320 file_type_long($1) .
2321 ')</span>';
2322 }
2323 # match <hash>
cfb04911 2324 if ($line =~ oid_nlen_prefix_infix_regex($sha1_len, "index ", ",") |
2325 $line =~ oid_nlen_prefix_infix_regex($sha256_len, "index ", ",")) {
90921740
JN
2326 # can match only for combined diff
2327 $line = 'index ';
2328 for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
2329 if ($from->{'href'}[$i]) {
2330 $line .= $cgi->a({-href=>$from->{'href'}[$i],
2331 -class=>"hash"},
2332 substr($diffinfo->{'from_id'}[$i],0,7));
2333 } else {
2334 $line .= '0' x 7;
2335 }
2336 # separator
2337 $line .= ',' if ($i < $diffinfo->{'nparents'} - 1);
2338 }
2339 $line .= '..';
2340 if ($to->{'href'}) {
2341 $line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
2342 substr($diffinfo->{'to_id'},0,7));
2343 } else {
2344 $line .= '0' x 7;
2345 }
2346
cfb04911 2347 } elsif ($line =~ oid_nlen_prefix_infix_regex($sha1_len, "index ", "..") |
2348 $line =~ oid_nlen_prefix_infix_regex($sha256_len, "index ", "..")) {
90921740
JN
2349 # can match only for ordinary diff
2350 my ($from_link, $to_link);
2351 if ($from->{'href'}) {
2352 $from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
2353 substr($diffinfo->{'from_id'},0,7));
2354 } else {
2355 $from_link = '0' x 7;
2356 }
2357 if ($to->{'href'}) {
2358 $to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
2359 substr($diffinfo->{'to_id'},0,7));
2360 } else {
2361 $to_link = '0' x 7;
2362 }
2363 my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
2364 $line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
2365 }
2366
2367 return $line . "<br/>\n";
2368}
2369
2370# format from-file/to-file diff header
2371sub format_diff_from_to_header {
91af4ce4 2372 my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
90921740
JN
2373 my $line;
2374 my $result = '';
2375
2376 $line = $from_line;
2377 #assert($line =~ m/^---/) if DEBUG;
deaa01a9
JN
2378 # no extra formatting for "^--- /dev/null"
2379 if (! $diffinfo->{'nparents'}) {
2380 # ordinary (single parent) diff
2381 if ($line =~ m!^--- "?a/!) {
2382 if ($from->{'href'}) {
2383 $line = '--- a/' .
2384 $cgi->a({-href=>$from->{'href'}, -class=>"path"},
2385 esc_path($from->{'file'}));
2386 } else {
2387 $line = '--- a/' .
2388 esc_path($from->{'file'});
2389 }
2390 }
2391 $result .= qq!<div class="diff from_file">$line</div>\n!;
2392
2393 } else {
2394 # combined diff (merge commit)
2395 for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
2396 if ($from->{'href'}[$i]) {
2397 $line = '--- ' .
91af4ce4
JN
2398 $cgi->a({-href=>href(action=>"blobdiff",
2399 hash_parent=>$diffinfo->{'from_id'}[$i],
2400 hash_parent_base=>$parents[$i],
2401 file_parent=>$from->{'file'}[$i],
2402 hash=>$diffinfo->{'to_id'},
2403 hash_base=>$hash,
2404 file_name=>$to->{'file'}),
2405 -class=>"path",
2406 -title=>"diff" . ($i+1)},
2407 $i+1) .
2408 '/' .
deaa01a9
JN
2409 $cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
2410 esc_path($from->{'file'}[$i]));
2411 } else {
2412 $line = '--- /dev/null';
2413 }
2414 $result .= qq!<div class="diff from_file">$line</div>\n!;
90921740
JN
2415 }
2416 }
90921740
JN
2417
2418 $line = $to_line;
2419 #assert($line =~ m/^\+\+\+/) if DEBUG;
2420 # no extra formatting for "^+++ /dev/null"
2421 if ($line =~ m!^\+\+\+ "?b/!) {
2422 if ($to->{'href'}) {
2423 $line = '+++ b/' .
2424 $cgi->a({-href=>$to->{'href'}, -class=>"path"},
2425 esc_path($to->{'file'}));
2426 } else {
2427 $line = '+++ b/' .
2428 esc_path($to->{'file'});
2429 }
2430 }
2431 $result .= qq!<div class="diff to_file">$line</div>\n!;
2432
2433 return $result;
2434}
2435
cd030c3a
JN
2436# create note for patch simplified by combined diff
2437sub format_diff_cc_simplified {
2438 my ($diffinfo, @parents) = @_;
2439 my $result = '';
2440
2441 $result .= "<div class=\"diff header\">" .
2442 "diff --cc ";
2443 if (!is_deleted($diffinfo)) {
2444 $result .= $cgi->a({-href => href(action=>"blob",
2445 hash_base=>$hash,
2446 hash=>$diffinfo->{'to_id'},
2447 file_name=>$diffinfo->{'to_file'}),
2448 -class => "path"},
2449 esc_path($diffinfo->{'to_file'}));
2450 } else {
2451 $result .= esc_path($diffinfo->{'to_file'});
2452 }
2453 $result .= "</div>\n" . # class="diff header"
2454 "<div class=\"diff nodifferences\">" .
2455 "Simple merge" .
2456 "</div>\n"; # class="diff nodifferences"
2457
2458 return $result;
2459}
2460
20a864cd
JN
2461sub diff_line_class {
2462 my ($line, $from, $to) = @_;
2463
2464 # ordinary diff
2465 my $num_sign = 1;
2466 # combined diff
2467 if ($from && $to && ref($from->{'href'}) eq "ARRAY") {
2468 $num_sign = scalar @{$from->{'href'}};
2469 }
2470
2471 my @diff_line_classifier = (
2472 { regexp => qr/^\@\@{$num_sign} /, class => "chunk_header"},
2473 { regexp => qr/^\\/, class => "incomplete" },
2474 { regexp => qr/^ {$num_sign}/, class => "ctx" },
2475 # classifier for context must come before classifier add/rem,
2476 # or we would have to use more complicated regexp, for example
2477 # qr/(?= {0,$m}\+)[+ ]{$num_sign}/, where $m = $num_sign - 1;
2478 { regexp => qr/^[+ ]{$num_sign}/, class => "add" },
2479 { regexp => qr/^[- ]{$num_sign}/, class => "rem" },
2480 );
2481 for my $clsfy (@diff_line_classifier) {
2482 return $clsfy->{'class'}
2483 if ($line =~ $clsfy->{'regexp'});
2484 }
2485
2486 # fallback
2487 return "";
2488}
2489
f1310cf5
JN
2490# assumes that $from and $to are defined and correctly filled,
2491# and that $line holds a line of chunk header for unified diff
2492sub format_unidiff_chunk_header {
2493 my ($line, $from, $to) = @_;
2494
2495 my ($from_text, $from_start, $from_lines, $to_text, $to_start, $to_lines, $section) =
2496 $line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;
2497
2498 $from_lines = 0 unless defined $from_lines;
2499 $to_lines = 0 unless defined $to_lines;
2500
2501 if ($from->{'href'}) {
2502 $from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
2503 -class=>"list"}, $from_text);
2504 }
2505 if ($to->{'href'}) {
2506 $to_text = $cgi->a({-href=>"$to->{'href'}#l$to_start",
2507 -class=>"list"}, $to_text);
2508 }
2509 $line = "<span class=\"chunk_info\">@@ $from_text $to_text @@</span>" .
2510 "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
2511 return $line;
2512}
2513
2514# assumes that $from and $to are defined and correctly filled,
2515# and that $line holds a line of chunk header for combined diff
2516sub format_cc_diff_chunk_header {
2517 my ($line, $from, $to) = @_;
2518
2519 my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;
2520 my (@from_text, @from_start, @from_nlines, $to_text, $to_start, $to_nlines);
2521
2522 @from_text = split(' ', $ranges);
2523 for (my $i = 0; $i < @from_text; ++$i) {
2524 ($from_start[$i], $from_nlines[$i]) =
2525 (split(',', substr($from_text[$i], 1)), 0);
2526 }
2527
2528 $to_text = pop @from_text;
2529 $to_start = pop @from_start;
2530 $to_nlines = pop @from_nlines;
2531
2532 $line = "<span class=\"chunk_info\">$prefix ";
2533 for (my $i = 0; $i < @from_text; ++$i) {
2534 if ($from->{'href'}[$i]) {
2535 $line .= $cgi->a({-href=>"$from->{'href'}[$i]#l$from_start[$i]",
2536 -class=>"list"}, $from_text[$i]);
2537 } else {
2538 $line .= $from_text[$i];
2539 }
2540 $line .= " ";
2541 }
2542 if ($to->{'href'}) {
2543 $line .= $cgi->a({-href=>"$to->{'href'}#l$to_start",
2544 -class=>"list"}, $to_text);
2545 } else {
2546 $line .= $to_text;
2547 }
2548 $line .= " $prefix</span>" .
2549 "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
2550 return $line;
2551}
2552
6ba1eb51 2553# process patch (diff) line (not to be used for diff headers),
5fb6ddf6
MK
2554# returning HTML-formatted (but not wrapped) line.
2555# If the line is passed as a reference, it is treated as HTML and not
2556# esc_html()'ed.
f4a81026
MK
2557sub format_diff_line {
2558 my ($line, $diff_class, $from, $to) = @_;
eee08903 2559
5fb6ddf6
MK
2560 if (ref($line)) {
2561 $line = $$line;
f4a81026 2562 } else {
5fb6ddf6
MK
2563 chomp $line;
2564 $line = untabify($line);
20a864cd 2565
5fb6ddf6
MK
2566 if ($from && $to && $line =~ m/^\@{2} /) {
2567 $line = format_unidiff_chunk_header($line, $from, $to);
2568 } elsif ($from && $to && $line =~ m/^\@{3}/) {
2569 $line = format_cc_diff_chunk_header($line, $from, $to);
2570 } else {
2571 $line = esc_html($line, -nbsp=>1);
2572 }
59e3b14e 2573 }
e72c0eaf 2574
f4a81026
MK
2575 my $diff_classes = "diff";
2576 $diff_classes .= " $diff_class" if ($diff_class);
2577 $line = "<div class=\"$diff_classes\">$line</div>\n";
f1310cf5 2578
f4a81026 2579 return $line;
eee08903
JN
2580}
2581
a3c8ab30
MM
2582# Generates undef or something like "_snapshot_" or "snapshot (_tbz2_ _zip_)",
2583# linked. Pass the hash of the tree/commit to snapshot.
2584sub format_snapshot_links {
2585 my ($hash) = @_;
a3c8ab30
MM
2586 my $num_fmts = @snapshot_fmts;
2587 if ($num_fmts > 1) {
2588 # A parenthesized list of links bearing format names.
a781785d 2589 # e.g. "snapshot (_tar.gz_ _zip_)"
a3c8ab30
MM
2590 return "snapshot (" . join(' ', map
2591 $cgi->a({
2592 -href => href(
2593 action=>"snapshot",
2594 hash=>$hash,
2595 snapshot_format=>$_
2596 )
2597 }, $known_snapshot_formats{$_}{'display'})
2598 , @snapshot_fmts) . ")";
2599 } elsif ($num_fmts == 1) {
2600 # A single "snapshot" link whose tooltip bears the format name.
a781785d 2601 # i.e. "_snapshot_"
a3c8ab30 2602 my ($fmt) = @snapshot_fmts;
a781785d
JN
2603 return
2604 $cgi->a({
a3c8ab30
MM
2605 -href => href(
2606 action=>"snapshot",
2607 hash=>$hash,
2608 snapshot_format=>$fmt
2609 ),
2610 -title => "in format: $known_snapshot_formats{$fmt}{'display'}"
2611 }, "snapshot");
2612 } else { # $num_fmts == 0
2613 return undef;
2614 }
2615}
2616
3562198b
JN
2617## ......................................................................
2618## functions returning values to be passed, perhaps after some
2619## transformation, to other functions; e.g. returning arguments to href()
2620
2621# returns hash to be passed to href to generate gitweb URL
2622# in -title key it returns description of link
2623sub get_feed_info {
2624 my $format = shift || 'Atom';
2625 my %res = (action => lc($format));
8d646a9b 2626 my $matched_ref = 0;
3562198b
JN
2627
2628 # feed links are possible only for project views
2629 return unless (defined $project);
2630 # some views should link to OPML, or to generic project feed,
2631 # or don't have specific feed yet (so they should use generic)
18ab83e8 2632 return if (!$action || $action =~ /^(?:tags|heads|forks|tag|search)$/x);
3562198b 2633
8d646a9b
KN
2634 my $branch = undef;
2635 # branches refs uses 'refs/' + $get_branch_refs()[x] + '/' prefix
2636 # (fullname) to differentiate from tag links; this also makes
2637 # possible to detect branch links
2638 for my $ref (get_branch_refs()) {
2639 if ((defined $hash_base && $hash_base =~ m!^refs/\Q$ref\E/(.*)$!) ||
2640 (defined $hash && $hash =~ m!^refs/\Q$ref\E/(.*)$!)) {
2641 $branch = $1;
2642 $matched_ref = $ref;
2643 last;
2644 }
3562198b
JN
2645 }
2646 # find log type for feed description (title)
2647 my $type = 'log';
2648 if (defined $file_name) {
2649 $type = "history of $file_name";
2650 $type .= "/" if ($action eq 'tree');
2651 $type .= " on '$branch'" if (defined $branch);
2652 } else {
2653 $type = "log of $branch" if (defined $branch);
2654 }
2655
2656 $res{-title} = $type;
8d646a9b 2657 $res{'hash'} = (defined $branch ? "refs/$matched_ref/$branch" : undef);
3562198b
JN
2658 $res{'file_name'} = $file_name;
2659
2660 return %res;
2661}
2662
717b8311
JN
2663## ----------------------------------------------------------------------
2664## git utility subroutines, invoking git commands
42f7eb94 2665
25691fbe
DS
2666# returns path to the core git executable and the --git-dir parameter as list
2667sub git_cmd {
aa7dd05e 2668 $number_of_git_cmds++;
25691fbe
DS
2669 return $GIT, '--git-dir='.$git_dir;
2670}
2671
516381d5
LW
2672# quote the given arguments for passing them to the shell
2673# quote_command("command", "arg 1", "arg with ' and ! characters")
2674# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
2675# Try to avoid using this function wherever possible.
2676sub quote_command {
2677 return join(' ',
68cedb1f 2678 map { my $a = $_; $a =~ s/(['!])/'\\$1'/g; "'$a'" } @_ );
25691fbe
DS
2679}
2680
717b8311 2681# get HEAD ref of given project as hash
847e01fb 2682sub git_get_head_hash {
b629275f
MR
2683 return git_get_full_hash(shift, 'HEAD');
2684}
2685
2686sub git_get_full_hash {
2687 return git_get_hash(@_);
2688}
2689
2690sub git_get_short_hash {
2691 return git_get_hash(@_, '--short=7');
2692}
2693
2694sub git_get_hash {
2695 my ($project, $hash, @options) = @_;
25691fbe 2696 my $o_git_dir = $git_dir;
df2c37a5 2697 my $retval = undef;
25691fbe 2698 $git_dir = "$projectroot/$project";
b629275f
MR
2699 if (open my $fd, '-|', git_cmd(), 'rev-parse',
2700 '--verify', '-q', @options, $hash) {
2701 $retval = <$fd>;
2702 chomp $retval if defined $retval;
df2c37a5 2703 close $fd;
df2c37a5 2704 }
25691fbe
DS
2705 if (defined $o_git_dir) {
2706 $git_dir = $o_git_dir;
2c5c008b 2707 }
df2c37a5
JH
2708 return $retval;
2709}
2710
717b8311
JN
2711# get type of given object
2712sub git_get_type {
2713 my $hash = shift;
2714
25691fbe 2715 open my $fd, "-|", git_cmd(), "cat-file", '-t', $hash or return;
717b8311
JN
2716 my $type = <$fd>;
2717 close $fd or return;
2718 chomp $type;
2719 return $type;
2720}
2721
b201927a
JN
2722# repository configuration
2723our $config_file = '';
2724our %config;
2725
2726# store multiple values for single key as anonymous array reference
2727# single values stored directly in the hash, not as [ <value> ]
2728sub hash_set_multi {
2729 my ($hash, $key, $value) = @_;
2730
2731 if (!exists $hash->{$key}) {
2732 $hash->{$key} = $value;
2733 } elsif (!ref $hash->{$key}) {
2734 $hash->{$key} = [ $hash->{$key}, $value ];
2735 } else {
2736 push @{$hash->{$key}}, $value;
2737 }
2738}
2739
2740# return hash of git project configuration
2741# optionally limited to some section, e.g. 'gitweb'
2742sub git_parse_project_config {
2743 my $section_regexp = shift;
2744 my %config;
2745
2746 local $/ = "\0";
2747
2748 open my $fh, "-|", git_cmd(), "config", '-z', '-l',
2749 or return;
2750
2751 while (my $keyval = <$fh>) {
2752 chomp $keyval;
2753 my ($key, $value) = split(/\n/, $keyval, 2);
2754
2755 hash_set_multi(\%config, $key, $value)
2756 if (!defined $section_regexp || $key =~ /^(?:$section_regexp)\./o);
2757 }
2758 close $fh;
2759
2760 return %config;
2761}
2762
df5d10a3 2763# convert config value to boolean: 'true' or 'false'
b201927a
JN
2764# no value, number > 0, 'true' and 'yes' values are true
2765# rest of values are treated as false (never as error)
2766sub config_to_bool {
2767 my $val = shift;
2768
df5d10a3
MC
2769 return 1 if !defined $val; # section.key
2770
b201927a
JN
2771 # strip leading and trailing whitespace
2772 $val =~ s/^\s+//;
2773 $val =~ s/\s+$//;
2774
df5d10a3 2775 return (($val =~ /^\d+$/ && $val) || # section.key = 1
b201927a
JN
2776 ($val =~ /^(?:true|yes)$/i)); # section.key = true
2777}
2778
2779# convert config value to simple decimal number
2780# an optional value suffix of 'k', 'm', or 'g' will cause the value
2781# to be multiplied by 1024, 1048576, or 1073741824
2782sub config_to_int {
2783 my $val = shift;
2784
2785 # strip leading and trailing whitespace
2786 $val =~ s/^\s+//;
2787 $val =~ s/\s+$//;
2788
2789 if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
2790 $unit = lc($unit);
2791 # unknown unit is treated as 1
2792 return $num * ($unit eq 'g' ? 1073741824 :
2793 $unit eq 'm' ? 1048576 :
2794 $unit eq 'k' ? 1024 : 1);
2795 }
2796 return $val;
2797}
2798
2799# convert config value to array reference, if needed
2800sub config_to_multi {
2801 my $val = shift;
2802
d76a585d 2803 return ref($val) ? $val : (defined($val) ? [ $val ] : []);
b201927a
JN
2804}
2805
717b8311 2806sub git_get_project_config {
ddb8d900 2807 my ($key, $type) = @_;
717b8311 2808
7a49c254 2809 return unless defined $git_dir;
9be3614e 2810
b201927a 2811 # key sanity check
717b8311 2812 return unless ($key);
14569cd8
JN
2813 # only subsection, if exists, is case sensitive,
2814 # and not lowercased by 'git config -z -l'
2815 if (my ($hi, $mi, $lo) = ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/)) {
af507944 2816 $lo =~ s/_//g;
14569cd8 2817 $key = join(".", lc($hi), $mi, lc($lo));
af507944 2818 return if ($lo =~ /\W/ || $hi =~ /\W/);
14569cd8
JN
2819 } else {
2820 $key = lc($key);
af507944
PP
2821 $key =~ s/_//g;
2822 return if ($key =~ /\W/);
14569cd8 2823 }
717b8311 2824 $key =~ s/^gitweb\.//;
717b8311 2825
b201927a
JN
2826 # type sanity check
2827 if (defined $type) {
2828 $type =~ s/^--//;
2829 $type = undef
2830 unless ($type eq 'bool' || $type eq 'int');
2831 }
2832
2833 # get config
2834 if (!defined $config_file ||
2835 $config_file ne "$git_dir/config") {
2836 %config = git_parse_project_config('gitweb');
2837 $config_file = "$git_dir/config";
2838 }
2839
df5d10a3
MC
2840 # check if config variable (key) exists
2841 return unless exists $config{"gitweb.$key"};
2842
b201927a
JN
2843 # ensure given type
2844 if (!defined $type) {
2845 return $config{"gitweb.$key"};
2846 } elsif ($type eq 'bool') {
2847 # backward compatibility: 'git config --bool' returns true/false
2848 return config_to_bool($config{"gitweb.$key"}) ? 'true' : 'false';
2849 } elsif ($type eq 'int') {
2850 return config_to_int($config{"gitweb.$key"});
2851 }
2852 return $config{"gitweb.$key"};
717b8311
JN
2853}
2854
717b8311
JN
2855# get hash of given path at given ref
2856sub git_get_hash_by_path {
2857 my $base = shift;
2858 my $path = shift || return undef;
1d782b03 2859 my $type = shift;
717b8311 2860
4b02f483 2861 $path =~ s,/+$,,;
717b8311 2862
25691fbe 2863 open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
074afaa0 2864 or die_error(500, "Open git-ls-tree failed");
717b8311
JN
2865 my $line = <$fd>;
2866 close $fd or return undef;
2867
198a2a8a
JN
2868 if (!defined $line) {
2869 # there is no tree or hash given by $path at $base
2870 return undef;
2871 }
2872
717b8311 2873 #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa panic.c'
cfb04911 2874 $line =~ m/^([0-9]+) (.+) ($oid_regex)\t/;
1d782b03
JN
2875 if (defined $type && $type ne $2) {
2876 # type doesn't match
2877 return undef;
2878 }
717b8311
JN
2879 return $3;
2880}
2881
ed224dea
JN
2882# get path of entry with given hash at given tree-ish (ref)
2883# used to get 'from' filename for combined diff (merge commit) for renames
2884sub git_get_path_by_hash {
2885 my $base = shift || return;
2886 my $hash = shift || return;
2887
2888 local $/ = "\0";
2889
2890 open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
2891 or return undef;
2892 while (my $line = <$fd>) {
2893 chomp $line;
2894
2895 #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423 gitweb'
2896 #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f gitweb/README'
2897 if ($line =~ m/(?:[0-9]+) (?:.+) $hash\t(.+)$/) {
2898 close $fd;
2899 return $1;
2900 }
2901 }
2902 close $fd;
2903 return undef;
2904}
2905
717b8311
JN
2906## ......................................................................
2907## git utility functions, directly accessing git repository
2908
e4e3b32b
SC
2909# get the value of config variable either from file named as the variable
2910# itself in the repository ($GIT_DIR/$name file), or from gitweb.$name
2911# configuration variable in the repository config file.
2912sub git_get_file_or_project_config {
2913 my ($path, $name) = @_;
09bd7898 2914
0e121a2c 2915 $git_dir = "$projectroot/$path";
e4e3b32b
SC
2916 open my $fd, '<', "$git_dir/$name"
2917 or return git_get_project_config($name);
2918 my $conf = <$fd>;
b87d78d6 2919 close $fd;
e4e3b32b
SC
2920 if (defined $conf) {
2921 chomp $conf;
2eb54efc 2922 }
e4e3b32b
SC
2923 return $conf;
2924}
2925
2926sub git_get_project_description {
2927 my $path = shift;
2928 return git_get_file_or_project_config($path, 'description');
12a88f2f
KS
2929}
2930
d940c901
SC
2931sub git_get_project_category {
2932 my $path = shift;
2933 return git_get_file_or_project_config($path, 'category');
12a88f2f
KS
2934}
2935
d940c901 2936
0368c492
JN
2937# supported formats:
2938# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
2939# - if its contents is a number, use it as tag weight,
2940# - otherwise add a tag with weight 1
2941# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
2942# the same value multiple times increases tag weight
2943# * `gitweb.ctag' multi-valued repo config variable
aed93de4 2944sub git_get_project_ctags {
0368c492 2945 my $project = shift;
aed93de4
PB
2946 my $ctags = {};
2947
0368c492
JN
2948 $git_dir = "$projectroot/$project";
2949 if (opendir my $dh, "$git_dir/ctags") {
2950 my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
2951 foreach my $tagfile (@files) {
2952 open my $ct, '<', $tagfile
2953 or next;
2954 my $val = <$ct>;
2955 chomp $val if $val;
2956 close $ct;
2957
2958 (my $ctag = $tagfile) =~ s#.*/##;
2c162b56 2959 if ($val =~ /^\d+$/) {
0368c492
JN
2960 $ctags->{$ctag} = $val;
2961 } else {
2962 $ctags->{$ctag} = 1;
2963 }
2964 }
2965 closedir $dh;
2966
2967 } elsif (open my $fh, '<', "$git_dir/ctags") {
2968 while (my $line = <$fh>) {
2969 chomp $line;
2970 $ctags->{$line}++ if $line;
2971 }
2972 close $fh;
2973
2974 } else {
2975 my $taglist = config_to_multi(git_get_project_config('ctag'));
2976 foreach my $tag (@$taglist) {
2977 $ctags->{$tag}++;
2978 }
aed93de4 2979 }
0368c492
JN
2980
2981 return $ctags;
2982}
2983
2984# return hash, where keys are content tags ('ctags'),
2985# and values are sum of weights of given tag in every project
2986sub git_gather_all_ctags {
2987 my $projects = shift;
2988 my $ctags = {};
2989
2990 foreach my $p (@$projects) {
2991 foreach my $ct (keys %{$p->{'ctags'}}) {
2992 $ctags->{$ct} += $p->{'ctags'}->{$ct};
2993 }
aed93de4 2994 }
0368c492
JN
2995
2996 return $ctags;
aed93de4
PB
2997}
2998
2999sub git_populate_project_tagcloud {
3000 my $ctags = shift;
3001
3002 # First, merge different-cased tags; tags vote on casing
3003 my %ctags_lc;
3004 foreach (keys %$ctags) {
3005 $ctags_lc{lc $_}->{count} += $ctags->{$_};
3006 if (not $ctags_lc{lc $_}->{topcount}
3007 or $ctags_lc{lc $_}->{topcount} < $ctags->{$_}) {
3008 $ctags_lc{lc $_}->{topcount} = $ctags->{$_};
3009 $ctags_lc{lc $_}->{topname} = $_;
3010 }
3011 }
3012
3013 my $cloud;
84d9e2d5 3014 my $matched = $input_params{'ctag'};
aed93de4
PB
3015 if (eval { require HTML::TagCloud; 1; }) {
3016 $cloud = HTML::TagCloud->new;
0368c492 3017 foreach my $ctag (sort keys %ctags_lc) {
aed93de4
PB
3018 # Pad the title with spaces so that the cloud looks
3019 # less crammed.
0368c492 3020 my $title = esc_html($ctags_lc{$ctag}->{topname});
aed93de4
PB
3021 $title =~ s/ /&nbsp;/g;
3022 $title =~ s/^/&nbsp;/g;
3023 $title =~ s/$/&nbsp;/g;
4b9447f9
JN
3024 if (defined $matched && $matched eq $ctag) {
3025 $title = qq(<span class="match">$title</span>);
3026 }
0368c492
JN
3027 $cloud->add($title, href(project=>undef, ctag=>$ctag),
3028 $ctags_lc{$ctag}->{count});
aed93de4
PB
3029 }
3030 } else {
0368c492
JN
3031 $cloud = {};
3032 foreach my $ctag (keys %ctags_lc) {
4b9447f9
JN
3033 my $title = esc_html($ctags_lc{$ctag}->{topname}, -nbsp=>1);
3034 if (defined $matched && $matched eq $ctag) {
3035 $title = qq(<span class="match">$title</span>);
3036 }
0368c492
JN
3037 $cloud->{$ctag}{count} = $ctags_lc{$ctag}->{count};
3038 $cloud->{$ctag}{ctag} =
4b9447f9 3039 $cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
0368c492 3040 }
aed93de4 3041 }
0368c492 3042 return $cloud;
aed93de4
PB
3043}
3044
3045sub git_show_project_tagcloud {
3046 my ($cloud, $count) = @_;
aed93de4
PB
3047 if (ref $cloud eq 'HTML::TagCloud') {
3048 return $cloud->html_and_css($count);
3049 } else {
0368c492
JN
3050 my @tags = sort { $cloud->{$a}->{'count'} <=> $cloud->{$b}->{'count'} } keys %$cloud;
3051 return
3052 '<div id="htmltagcloud"'.($project ? '' : ' align="center"').'>' .
3053 join (', ', map {
3054 $cloud->{$_}->{'ctag'}
3055 } splice(@tags, 0, $count)) .
3056 '</div>';
aed93de4
PB
3057 }
3058}
3059
e79ca7cc
JN
3060sub git_get_project_url_list {
3061 my $path = shift;
3062
0e121a2c 3063 $git_dir = "$projectroot/$path";
dff2b6d4 3064 open my $fd, '<', "$git_dir/cloneurl"
0e121a2c
JN
3065 or return wantarray ?
3066 @{ config_to_multi(git_get_project_config('url')) } :
3067 config_to_multi(git_get_project_config('url'));
e79ca7cc
JN
3068 my @git_project_url_list = map { chomp; $_ } <$fd>;
3069 close $fd;
3070
3071 return wantarray ? @git_project_url_list : \@git_project_url_list;
3072}
3073
847e01fb 3074sub git_get_projects_list {
12b1443c 3075 my $filter = shift || '';
348a6589 3076 my $paranoid = shift;
717b8311
JN
3077 my @list;
3078
3079 if (-d $projects_list) {
3080 # search in directory
12b1443c 3081 my $dir = $projects_list;
6768d6b8
AK
3082 # remove the trailing "/"
3083 $dir =~ s!/+$!!;
ac593b76
MM
3084 my $pfxlen = length("$dir");
3085 my $pfxdepth = ($dir =~ tr!/!!);
12b1443c 3086 # when filtering, search only given subdirectory
348a6589 3087 if ($filter && !$paranoid) {
12b1443c
JN
3088 $dir .= "/$filter";
3089 $dir =~ s!/+$!!;
3090 }
c0011ff8
JN
3091
3092 File::Find::find({
3093 follow_fast => 1, # follow symbolic links
d20602ee 3094 follow_skip => 2, # ignore duplicates
c0011ff8
JN
3095 dangling_symlinks => 0, # ignore dangling symlinks, silently
3096 wanted => sub {
ee1d8ee0
JN
3097 # global variables
3098 our $project_maxdepth;
3099 our $projectroot;
c0011ff8
JN
3100 # skip project-list toplevel, if we get it.
3101 return if (m!^[/.]$!);
3102 # only directories can be git repositories
3103 return unless (-d $_);
46a13857
HCB
3104 # need search permission
3105 return unless (-x $_);
ca5e9495 3106 # don't traverse too deep (Find is super slow on os x)
12b1443c 3107 # $project_maxdepth excludes depth of $projectroot
ca5e9495
LL
3108 if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
3109 $File::Find::prune = 1;
3110 return;
3111 }
c0011ff8 3112
12b1443c 3113 my $path = substr($File::Find::name, $pfxlen + 1);
348a6589
BL
3114 # paranoidly only filter here
3115 if ($paranoid && $filter && $path !~ m!^\Q$filter\E/!) {
3116 next;
3117 }
c0011ff8 3118 # we check related file in $projectroot
fb3bb3d1
DD
3119 if (check_export_ok("$projectroot/$path")) {
3120 push @list, { path => $path };
c0011ff8
JN
3121 $File::Find::prune = 1;
3122 }
3123 },
3124 }, "$dir");
3125
717b8311
JN
3126 } elsif (-f $projects_list) {
3127 # read from file(url-encoded):
3128 # 'git%2Fgit.git Linus+Torvalds'
3129 # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
3130 # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
dff2b6d4 3131 open my $fd, '<', $projects_list or return;
c2b8b134 3132 PROJECT:
717b8311
JN
3133 while (my $line = <$fd>) {
3134 chomp $line;
3135 my ($path, $owner) = split ' ', $line;
3136 $path = unescape($path);
3137 $owner = unescape($owner);
3138 if (!defined $path) {
3139 next;
3140 }
12b1443c
JN
3141 # if $filter is rpovided, check if $path begins with $filter
3142 if ($filter && $path !~ m!^\Q$filter\E/!) {
3143 next;
83ee94c1 3144 }
2172ce4b 3145 if (check_export_ok("$projectroot/$path")) {
717b8311 3146 my $pr = {
75e0dffe 3147 path => $path
717b8311 3148 };
75e0dffe
KK
3149 if ($owner) {
3150 $pr->{'owner'} = to_utf8($owner);
3151 }
c2b8b134 3152 push @list, $pr;
717b8311
JN
3153 }
3154 }
3155 close $fd;
3156 }
717b8311
JN
3157 return @list;
3158}
3159
64127575 3160# written with help of Tree::Trie module (Perl Artistic License, GPL compatible)
12b1443c
JN
3161# as side effects it sets 'forks' field to list of forks for forked projects
3162sub filter_forks_from_projects_list {
3163 my $projects = shift;
3164
3165 my %trie; # prefix tree of directories (path components)
3166 # generate trie out of those directories that might contain forks
3167 foreach my $pr (@$projects) {
3168 my $path = $pr->{'path'};
3169 $path =~ s/\.git$//; # forks of 'repo.git' are in 'repo/' directory
3170 next if ($path =~ m!/$!); # skip non-bare repositories, e.g. 'repo/.git'
3171 next unless ($path); # skip '.git' repository: tests, git-instaweb
53c632fa 3172 next unless (-d "$projectroot/$path"); # containing directory exists
12b1443c
JN
3173 $pr->{'forks'} = []; # there can be 0 or more forks of project
3174
3175 # add to trie
3176 my @dirs = split('/', $path);
3177 # walk the trie, until either runs out of components or out of trie
3178 my $ref = \%trie;
3179 while (scalar @dirs &&
3180 exists($ref->{$dirs[0]})) {
3181 $ref = $ref->{shift @dirs};
3182 }
3183 # create rest of trie structure from rest of components
3184 foreach my $dir (@dirs) {
3185 $ref = $ref->{$dir} = {};
3186 }
3187 # create end marker, store $pr as a data
3188 $ref->{''} = $pr if (!exists $ref->{''});
3189 }
3190
3191 # filter out forks, by finding shortest prefix match for paths
3192 my @filtered;
3193 PROJECT:
3194 foreach my $pr (@$projects) {
3195 # trie lookup
3196 my $ref = \%trie;
3197 DIR:
3198 foreach my $dir (split('/', $pr->{'path'})) {
3199 if (exists $ref->{''}) {
3200 # found [shortest] prefix, is a fork - skip it
3201 push @{$ref->{''}{'forks'}}, $pr;
3202 next PROJECT;
3203 }
3204 if (!exists $ref->{$dir}) {
3205 # not in trie, cannot have prefix, not a fork
3206 push @filtered, $pr;
3207 next PROJECT;
3208 }
3209 # If the dir is there, we just walk one step down the trie.
3210 $ref = $ref->{$dir};
3211 }
3212 # we ran out of trie
3213 # (shouldn't happen: it's either no match, or end marker)
3214 push @filtered, $pr;
3215 }
3216
3217 return @filtered;
3218}
3219
3220# note: fill_project_list_info must be run first,
3221# for 'descr_long' and 'ctags' to be filled
3222sub search_projects_list {
3223 my ($projlist, %opts) = @_;
3224 my $tagfilter = $opts{'tagfilter'};
e65ceb61 3225 my $search_re = $opts{'search_regexp'};
12b1443c
JN
3226
3227 return @$projlist
e65ceb61 3228 unless ($tagfilter || $search_re);
12b1443c 3229
07b257f9
JN
3230 # searching projects require filling to be run before it;
3231 fill_project_list_info($projlist,
3232 $tagfilter ? 'ctags' : (),
aa145bf6 3233 $search_re ? ('path', 'descr') : ());
12b1443c
JN
3234 my @projects;
3235 PROJECT:
3236 foreach my $pr (@$projlist) {
3237
3238 if ($tagfilter) {
3239 next unless ref($pr->{'ctags'}) eq 'HASH';
3240 next unless
3241 grep { lc($_) eq lc($tagfilter) } keys %{$pr->{'ctags'}};
3242 }
3243
e65ceb61 3244 if ($search_re) {
12b1443c 3245 next unless
e65ceb61
JN
3246 $pr->{'path'} =~ /$search_re/ ||
3247 $pr->{'descr_long'} =~ /$search_re/;
12b1443c
JN
3248 }
3249
3250 push @projects, $pr;
3251 }
3252
3253 return @projects;
3254}
3255
47852450
JH
3256our $gitweb_project_owner = undef;
3257sub git_get_project_list_from_file {
1e0cf030 3258
47852450 3259 return if (defined $gitweb_project_owner);
1e0cf030 3260
47852450 3261 $gitweb_project_owner = {};
1e0cf030
JN
3262 # read from file (url-encoded):
3263 # 'git%2Fgit.git Linus+Torvalds'
3264 # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
3265 # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
3266 if (-f $projects_list) {
dff2b6d4 3267 open(my $fd, '<', $projects_list);
1e0cf030
JN
3268 while (my $line = <$fd>) {
3269 chomp $line;
3270 my ($pr, $ow) = split ' ', $line;
3271 $pr = unescape($pr);
3272 $ow = unescape($ow);
47852450 3273 $gitweb_project_owner->{$pr} = to_utf8($ow);
1e0cf030
JN
3274 }
3275 close $fd;
3276 }
47852450
JH
3277}
3278
3279sub git_get_project_owner {
3280 my $project = shift;
3281 my $owner;
3282
3283 return undef unless $project;
b59012ef 3284 $git_dir = "$projectroot/$project";
47852450
JH
3285
3286 if (!defined $gitweb_project_owner) {
3287 git_get_project_list_from_file();
3288 }
3289
3290 if (exists $gitweb_project_owner->{$project}) {
3291 $owner = $gitweb_project_owner->{$project};
3292 }
b59012ef
BR
3293 if (!defined $owner){
3294 $owner = git_get_project_config('owner');
3295 }
1e0cf030 3296 if (!defined $owner) {
b59012ef 3297 $owner = get_file_owner("$git_dir");
1e0cf030
JN
3298 }
3299
3300 return $owner;
3301}
3302
c60c56cc
JN
3303sub git_get_last_activity {
3304 my ($path) = @_;
3305 my $fd;
3306
3307 $git_dir = "$projectroot/$path";
3308 open($fd, "-|", git_cmd(), 'for-each-ref',
0ff5ec70 3309 '--format=%(committer)',
c60c56cc 3310 '--sort=-committerdate',
0ff5ec70 3311 '--count=1',
8d646a9b 3312 map { "refs/$_" } get_branch_refs ()) or return;
c60c56cc
JN
3313 my $most_recent = <$fd>;
3314 close $fd or return;
785cdea9
JN
3315 if (defined $most_recent &&
3316 $most_recent =~ / (\d+) [-+][01]\d\d\d$/) {
c60c56cc
JN
3317 my $timestamp = $1;
3318 my $age = time - $timestamp;
3319 return ($age, age_string($age));
3320 }
c956395e 3321 return (undef, undef);
c60c56cc
JN
3322}
3323
9d0d42f3
GB
3324# Implementation note: when a single remote is wanted, we cannot use 'git
3325# remote show -n' because that command always work (assuming it's a remote URL
3326# if it's not defined), and we cannot use 'git remote show' because that would
3327# try to make a network roundtrip. So the only way to find if that particular
3328# remote is defined is to walk the list provided by 'git remote -v' and stop if
3329# and when we find what we want.
3330sub git_get_remotes_list {
3331 my $wanted = shift;
3332 my %remotes = ();
3333
3334 open my $fd, '-|' , git_cmd(), 'remote', '-v';
3335 return unless $fd;
3336 while (my $remote = <$fd>) {
3337 chomp $remote;
3338 $remote =~ s!\t(.*?)\s+\((\w+)\)$!!;
3339 next if $wanted and not $remote eq $wanted;
3340 my ($url, $key) = ($1, $2);
3341
3342 $remotes{$remote} ||= { 'heads' => () };
3343 $remotes{$remote}{$key} = $url;
3344 }
3345 close $fd or return;
3346 return wantarray ? %remotes : \%remotes;
3347}
3348
3349# Takes a hash of remotes as first parameter and fills it by adding the
3350# available remote heads for each of the indicated remotes.
3351sub fill_remote_heads {
3352 my $remotes = shift;
3353 my @heads = map { "remotes/$_" } keys %$remotes;
3354 my @remoteheads = git_get_heads_list(undef, @heads);
3355 foreach my $remote (keys %$remotes) {
3356 $remotes->{$remote}{'heads'} = [ grep {
3357 $_->{'name'} =~ s!^$remote/!!
3358 } @remoteheads ];
3359 }
3360}
3361
847e01fb 3362sub git_get_references {
717b8311
JN
3363 my $type = shift || "";
3364 my %refs;
28b9d9f7
JN
3365 # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
3366 # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
3367 open my $fd, "-|", git_cmd(), "show-ref", "--dereference",
3368 ($type ? ("--", "refs/$type") : ()) # use -- <pattern> if $type
9704d75d 3369 or return;
d294e1ca 3370
717b8311
JN
3371 while (my $line = <$fd>) {
3372 chomp $line;
cfb04911 3373 if ($line =~ m!^($oid_regex)\srefs/($type.*)$!) {
717b8311 3374 if (defined $refs{$1}) {
d294e1ca 3375 push @{$refs{$1}}, $2;
717b8311 3376 } else {
d294e1ca 3377 $refs{$1} = [ $2 ];
717b8311
JN
3378 }
3379 }
3380 }
3381 close $fd or return;
3382 return \%refs;
3383}
3384
56a322f1
JN
3385sub git_get_rev_name_tags {
3386 my $hash = shift || return undef;
3387
25691fbe 3388 open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
56a322f1
JN
3389 or return;
3390 my $name_rev = <$fd>;
3391 close $fd;
3392
3393 if ($name_rev =~ m|^$hash tags/(.*)$|) {
3394 return $1;
3395 } else {
3396 # catches also '$hash undefined' output
3397 return undef;
3398 }
3399}
3400
717b8311
JN
3401## ----------------------------------------------------------------------
3402## parse to hash functions
3403
847e01fb 3404sub parse_date {
717b8311
JN
3405 my $epoch = shift;
3406 my $tz = shift || "-0000";
3407
3408 my %date;
3409 my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
3410 my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
3411 my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($epoch);
3412 $date{'hour'} = $hour;
3413 $date{'minute'} = $min;
3414 $date{'mday'} = $mday;
3415 $date{'day'} = $days[$wday];
3416 $date{'month'} = $months[$mon];
af6feeb2
JN
3417 $date{'rfc2822'} = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
3418 $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
952c65fc
JN
3419 $date{'mday-time'} = sprintf "%d %s %02d:%02d",
3420 $mday, $months[$mon], $hour ,$min;
af6feeb2 3421 $date{'iso-8601'} = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
a62d6d84 3422 1900+$year, 1+$mon, $mday, $hour ,$min, $sec;
717b8311 3423
2b1e1723
JN
3424 my ($tz_sign, $tz_hour, $tz_min) =
3425 ($tz =~ m/^([-+])(\d\d)(\d\d)$/);
3426 $tz_sign = ($tz_sign eq '-' ? -1 : +1);
3427 my $local = $epoch + $tz_sign*((($tz_hour*60) + $tz_min)*60);
717b8311
JN
3428 ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($local);
3429 $date{'hour_local'} = $hour;
3430 $date{'minute_local'} = $min;
3431 $date{'tz_local'} = $tz;
af6feeb2
JN
3432 $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
3433 1900+$year, $mon+1, $mday,
3434 $hour, $min, $sec, $tz);
717b8311
JN
3435 return %date;
3436}
3437
847e01fb 3438sub parse_tag {
ede5e100
KS
3439 my $tag_id = shift;
3440 my %tag;
d8a20ba9 3441 my @comment;
ede5e100 3442
25691fbe 3443 open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;
d8a20ba9 3444 $tag{'id'} = $tag_id;
ede5e100
KS
3445 while (my $line = <$fd>) {
3446 chomp $line;
cfb04911 3447 if ($line =~ m/^object ($oid_regex)$/) {
ede5e100 3448 $tag{'object'} = $1;
7ab0d2b6 3449 } elsif ($line =~ m/^type (.+)$/) {
ede5e100 3450 $tag{'type'} = $1;
7ab0d2b6 3451 } elsif ($line =~ m/^tag (.+)$/) {
ede5e100 3452 $tag{'name'} = $1;
d8a20ba9
KS
3453 } elsif ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
3454 $tag{'author'} = $1;
ba924733
GB
3455 $tag{'author_epoch'} = $2;
3456 $tag{'author_tz'} = $3;
3457 if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
3458 $tag{'author_name'} = $1;
3459 $tag{'author_email'} = $2;
3460 } else {
3461 $tag{'author_name'} = $tag{'author'};
3462 }
d8a20ba9
KS
3463 } elsif ($line =~ m/--BEGIN/) {
3464 push @comment, $line;
3465 last;
3466 } elsif ($line eq "") {
3467 last;
ede5e100
KS
3468 }
3469 }
d8a20ba9
KS
3470 push @comment, <$fd>;
3471 $tag{'comment'} = \@comment;
19806691 3472 close $fd or return;
ede5e100
KS
3473 if (!defined $tag{'name'}) {
3474 return
3475 };
3476 return %tag
3477}
3478
756bbf54 3479sub parse_commit_text {
ccdfdea0 3480 my ($commit_text, $withparents) = @_;
756bbf54 3481 my @commit_lines = split '\n', $commit_text;
703ac710 3482 my %co;
703ac710 3483
756bbf54
RF
3484 pop @commit_lines; # Remove '\0'
3485
198a2a8a
JN
3486 if (! @commit_lines) {
3487 return;
3488 }
3489
25f422fb 3490 my $header = shift @commit_lines;
cfb04911 3491 if ($header !~ m/^$oid_regex/) {
25f422fb
KS
3492 return;
3493 }
ccdfdea0 3494 ($co{'id'}, my @parents) = split ' ', $header;
19806691 3495 while (my $line = shift @commit_lines) {
b87d78d6 3496 last if $line eq "\n";
cfb04911 3497 if ($line =~ m/^tree ($oid_regex)$/) {
703ac710 3498 $co{'tree'} = $1;
cfb04911 3499 } elsif ((!defined $withparents) && ($line =~ m/^parent ($oid_regex)$/)) {
208b2dff 3500 push @parents, $1;
022be3d0 3501 } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
5ed5bbc7 3502 $co{'author'} = to_utf8($1);
185f09e5
KS
3503 $co{'author_epoch'} = $2;
3504 $co{'author_tz'} = $3;
ba00b8c1
JN
3505 if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
3506 $co{'author_name'} = $1;
3507 $co{'author_email'} = $2;
2bf7a52c
KS
3508 } else {
3509 $co{'author_name'} = $co{'author'};
3510 }
86eed32d 3511 } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
5ed5bbc7 3512 $co{'committer'} = to_utf8($1);
185f09e5
KS
3513 $co{'committer_epoch'} = $2;
3514 $co{'committer_tz'} = $3;
ba00b8c1
JN
3515 if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
3516 $co{'committer_name'} = $1;
3517 $co{'committer_email'} = $2;
3518 } else {
3519 $co{'committer_name'} = $co{'committer'};
3520 }
703ac710
KS
3521 }
3522 }
ede5e100 3523 if (!defined $co{'tree'}) {
25f422fb 3524 return;
ede5e100 3525 };
208b2dff
RF
3526 $co{'parents'} = \@parents;
3527 $co{'parent'} = $parents[0];
25f422fb 3528
19806691 3529 foreach my $title (@commit_lines) {
c2488d06 3530 $title =~ s/^ //;
19806691 3531 if ($title ne "") {
48c771f4 3532 $co{'title'} = chop_str($title, 80, 5);
19806691
KS
3533 # remove leading stuff of merges to make the interesting part visible
3534 if (length($title) > 50) {
3535 $title =~ s/^Automatic //;
3536 $title =~ s/^merge (of|with) /Merge ... /i;
3537 if (length($title) > 50) {
3538 $title =~ s/(http|rsync):\/\///;
3539 }
3540 if (length($title) > 50) {
3541 $title =~ s/(master|www|rsync)\.//;
3542 }
3543 if (length($title) > 50) {
3544 $title =~ s/kernel.org:?//;
3545 }
3546 if (length($title) > 50) {
3547 $title =~ s/\/pub\/scm//;
3548 }
3549 }