#!/usr/bin/perl use strict; use warnings; use Data::Dumper; $Data::Dumper::Indent = 1; $Data::Dumper::Sortkeys = 1; # === add-auth-keys === # part of the gitolite (GL) suite # (1) - "compiles" ~/.ssh/authorized_keys from the list of pub-keys # (2) - also "compiles" the user-friendly GL conf file into something easier # to parse. We're doing this because both the gl-auth-command and the # (gl-)update hook need this, and it seems easier to do this than # replicate the parsing code in both those places. As a bonus, it's # probably more efficient. # (3) - finally does what I have resisted doing all along -- handle gitweb and # git-daemon access. It won't *setup* gitweb/daemon for you -- you have # to that yourself. What this does is make sure that "repo.git" # contains the file "git-daemon-export-ok" (for daemon case) and the # line "repo.git" exists in the "projects.list" file (for gitweb case). # how run: manual, by GL admin # when: # - anytime a pubkey is added/deleted # - anytime gitolite.conf is changed # input: # - GL_CONF (default: ~/.gitolite/conf/gitolite.conf) # - GL_KEYDIR (default: ~/.gitolite/keydir) # output: # - ~/.ssh/authorized_keys (dictated by sshd) # - GL_CONF_COMPILED (default: ~/.gitolite/conf/gitolite.conf-compiled.pm) # security: # - touches a very critical system file that manages the restrictions on # incoming users. Be sure to audit AUTH_COMMAND and AUTH_OPTIONS (see # below) on any change to this script # - no security checks within program. The GL admin runs this manually # warnings: # - if the "start" line exists, but the "end" line does not, you lose the # rest of the existing authkey file. In general, "don't do that (TM)", # but we do have a "vim -d" popping up so you can see the changes being # made, just in case... # ---------------------------------------------------------------------------- # common definitions # ---------------------------------------------------------------------------- # setup quiet mode if asked; please do not use this when running manually open STDOUT, ">", "/dev/null" if (@ARGV and shift eq '-q'); # these are set by the "rc" file our ($GL_ADMINDIR, $GL_CONF, $GL_KEYDIR, $GL_CONF_COMPILED, $REPO_BASE, $REPO_UMASK, $PROJECTS_LIST, $GIT_PATH, $GL_WILDREPOS, $GL_GITCONFIG_KEYS, $GL_GITCONFIG_WILD, $GL_PACKAGE_HOOKS, $GL_BIG_CONFIG, $GL_NO_DAEMON_NO_GITWEB, $GL_NO_CREATE_REPOS, $GL_NO_SETUP_AUTHKEYS); # and these are set by gitolite.pm our ($REPONAME_PATT, $REPOPATT_PATT, $USERNAME_PATT, $ABRT, $WARN); # the common setup module is in the same directory as this running program is my $bindir = $0; $bindir =~ s/\/[^\/]+$//; $bindir = "$ENV{PWD}/$bindir" unless $bindir =~ /^\//; require "$bindir/gitolite.pm"; # ask where the rc file is, get it, and "do" it &where_is_rc(); die "$ABRT parse $ENV{GL_RC} failed: " . ($! or $@) unless do $ENV{GL_RC}; # add a custom path for git binaries, if specified $ENV{PATH} .= ":$GIT_PATH" if $GIT_PATH; # ---------------------------------------------------------------------------- # definitions specific to this program # ---------------------------------------------------------------------------- # groups can now represent user groups or repo groups. # $groups{group}{member} = "master" (or name of fragment file in which the # group is defined). our %groups = (); # %repos has two functions. # $repos{repo}{R|W}{user} = 1 if user has R (or W) permissions for at least # one branch in repo. This is used by the "level 1 check" (see faq). There's # also the new "C" (create a repo) permission now # $repos{repo}{user} is a list of {ref, perms} pairs. This is used by the # level 2 check. In order to allow "exclude" rules, the order of rules now # matters, so what used to be entirely "hash of hash of hash" now has a list # in between :) my %repos = (); # rule sequence number my $rule_seq = 0; # ... having been forced to use a list as described above, we lose some # efficiency due to the possibility of the same {ref, perms} pair showing up # multiple times for the same repo+user. So... my %rurp_seen = (); our $current_data_version; # this comes from gitolite.pm # catch usernames<->pubkeys mismatches; search for "lint" below my %user_list = (); # repo configurations my %repo_config = (); # gitweb descriptions and owners; plain text, keyed by "$repo.git" my %desc = (); my %owner = (); # set the umask before creating any files umask($REPO_UMASK); # ---------------------------------------------------------------------------- # subroutines # ---------------------------------------------------------------------------- sub expand_list { my @list = @_; my @new_list = (); for my $item (@list) { if ($item =~ /^@/) # nested group { die "$ABRT undefined group $item\n" unless $groups{$item}; # add those names to the list push @new_list, sort keys %{ $groups{$item} }; } else { push @new_list, $item; } } return @new_list; } # ---------------------------------------------------------------------------- # "compile" GL conf # ---------------------------------------------------------------------------- sub parse_conf_file { my ($conffile, $fragment) = @_; # the second arg, $fragment, is passed in as "master" when parsing the # main config, and the fragment name when parsing a fragment. In the # latter case, the parser uses that information to ignore (and warn about) # any repos in the fragment that are not members of the "repo group" of # the same name. my %ignored = (); my $conf_fh = wrap_open( "<", $conffile ); # the syntax is fairly simple, so we parse it inline my @repos; while (<$conf_fh>) { # kill comments, but take care of "#" inside *simple* strings s/^((".*?"|[^#"])*)#.*/$1/; # normalise whitespace; keeps later regexes very simple s/=/ = /; s/\s+/ /g; s/^ //; s/ $//; # and blank lines next unless /\S/; # user or repo groups if (/^(@\S+) = (.*)/) { die "$ABRT defining groups is not allowed inside fragments\n" if $GL_BIG_CONFIG and $fragment ne 'master'; # store the members of each group as hash key. Keep track of when # the group was *first* created by using $fragment as the *value* do { $groups{$1}{$_} ||= $fragment } for ( expand_list( split(' ', $2) ) ); die "$ABRT bad group $1\n" unless $1 =~ $REPONAME_PATT; } # repo(s) elsif (/^repo (.*)/) { # grab the list... @repos = split ' ', $1; unless (@repos == 1 and $repos[0] eq '@all') { # ...expand groups in the default case @repos = expand_list ( @repos ) unless $GL_BIG_CONFIG; # ...sanity check for (@repos) { die "$ABRT bad reponame $_\n" if ($GL_WILDREPOS and $_ !~ $REPOPATT_PATT); die "$ABRT bad reponame $_ or you forgot to set \$GL_WILDREPOS\n" if (not $GL_WILDREPOS and $_ !~ $REPONAME_PATT); } } s/\bCREAT[EO]R\b/\$creator/g for @repos; } # actual permission line elsif (/^(-|C|R|RW\+?(?:C?D?|D?C?)) (.* )?= (.+)/) { my $perms = $1; my @refs; @refs = split(' ', $2) if $2; @refs = expand_list ( @refs ); my @users = split ' ', $3; die "$ABRT \$GL_WILDREPOS is not set, you cant use 'C' in config\n" if $perms eq 'C' and not $GL_WILDREPOS; # if no ref is given, this PERM applies to all refs @refs = qw(refs/.*) unless @refs; # deprecation warning map { warn "WARNING: old syntax 'PATH/' found; please use new syntax 'NAME/'\n" if s(^PATH/)(NAME/) } @refs; # fully qualify refs that dont start with "refs/" or "NAME/"; # prefix them with "refs/heads/" @refs = map { m(^(refs|NAME)/) or s(^)(refs/heads/); $_ } @refs; @refs = map { s(/USER/)(/\$gl_user/); $_ } @refs; # expand the user list, unless it is just "@all" @users = expand_list ( @users ) unless ($GL_BIG_CONFIG or (@users == 1 and $users[0] eq '@all')); do { die "$ABRT bad username $_\n" unless $_ =~ $USERNAME_PATT } for @users; s/\bCREAT[EO]R\b/~\$creator/g for @users; s/\bREADERS\b/\$readers/g for @users; s/\bWRITERS\b/\$writers/g for @users; # ok, we can finally populate the %repos hash for my $repo (@repos) # each repo in the current stanza { # if we're processing a delegated config file (not the master # config), we need to prevent attempts by that admin to obtain # rights on stuff outside his domain # trying to set access for $repo (='foo')... if ( # processing the master config, not a fragment ( $fragment eq 'master' ) or # fragment is also called 'foo' (you're allowed to have a # fragment that is only concerned with one repo) ( $fragment eq $repo ) or # same thing in big-config-land; foo is just @foo now ( $GL_BIG_CONFIG and "\@$fragment" eq $repo ) or # fragment is called "bar" and "@bar = foo" has been # defined in the master config ( ($groups{"\@$fragment"}{$repo} || '') eq 'master' ) ) { # all these are fine } else { # this is a little more complex # fragment is called "bar", one or more "@bar = regex" # have been specified in master, and "foo" matches some # such "regex" my @matched = grep { $repo =~ /^$_$/ } grep { $groups{"\@$fragment"}{$_} eq 'master' } sort keys %{ $groups{"\@$fragment"} }; if (@matched < 1) { $ignored{$fragment}{$repo} = 1; next; } } for my $user (@users) { # lint check, to catch pubkey/username typos if ($user =~ /^@/ and $user ne '@all') { # this is a usergroup, not a normal user; happens with GL_BIG_CONFIG if (exists $groups{$user}) { $user_list{$_}++ for keys %{ $groups{$user} }; } } else { $user_list{$user}++; } # for 1st level check (see faq/tips doc) $repos{$repo}{C}{$user} = 1, next if $perms eq 'C'; $repos{$repo}{R}{$user} = 1 if $perms =~ /R/; $repos{$repo}{W}{$user} = 1 if $perms =~ /W|D/; # if the user specified even a single 'D' anywhere, make # that fact easy to find; this changes the meaning of RW+ # to no longer permit deletes (see update hook) $repos{$repo}{DELETE_IS_D} = 1 if $perms =~ /D/; $repos{$repo}{CREATE_IS_C} = 1 if $perms =~ /RW.*C/; # for 2nd level check, store each "ref, perms" pair in order for my $ref (@refs) { # checking NAME based restrictions is expensive for # the update hook (see the changes to src/hooks/update # in this commit for why) so we would *very* much like # to avoid doing it for the large majority of repos # that do *not* use NAME limits. Setting a flag that # can be checked right away will help us do that $repos{$repo}{NAME_LIMITS} = 1 if $ref =~ /^NAME\//; my $p_user = $user; $p_user =~ s/(creator|readers|writers)$/$1 - wild/; push @{ $repos{$repo}{$p_user} }, [ $rule_seq++, $ref, $perms ] unless $rurp_seen{$repo}{$p_user}{$ref}{$perms}++; } } } } # configuration elsif (/^config (.+) = ?(.*)/) { my ($key, $value) = ($1, $2); my @validkeys = split (' ', ($GL_GITCONFIG_KEYS || '')); my @matched = grep { $key =~ /^$_$/ } @validkeys; die "$ABRT git config $key not allowed\n" if (@matched < 1); for my $repo (@repos) # each repo in the current stanza { $repo_config{$repo}{$key} = $value; print STDERR "$WARN git config set for $repo but \$GL_GITCONFIG_WILD not set\n" unless $repo =~ $REPONAME_PATT or $GL_GITCONFIG_WILD; } } # include elsif (/^include "(.+)"/) { my $file = $1; $file = "$GL_ADMINDIR/conf/$file" unless $file =~ /^\//; die "$WARN $fragment attempting to include configuration\n" if $fragment ne 'master'; die "$ABRT included file not found: '$file'\n" unless -f $file; parse_conf_file($file, $fragment); } # very simple syntax for the gitweb description of repo; one of: # reponame = "some description string" # reponame "owner name" = "some description string" elsif (/^(\S+)(?: "(.*?)")? = "(.*)"$/) { my ($repo, $owner, $desc) = ($1, $2, $3); die "$ABRT bad repo name $repo\n" unless $repo =~ $REPONAME_PATT; die "$WARN $fragment attempting to set description for $repo\n" if $fragment ne 'master' and $fragment ne $repo and ($groups{"\@$fragment"}{$repo} || '') ne 'master'; $desc{"$repo.git"} = $desc; $owner{"$repo.git"} = $owner || ''; } else { die "$ABRT can't make head or tail of '$_'\n"; } } for my $ig (sort keys %ignored) { warn "\n\t\t***** WARNING *****\n" . "\t$ig.conf attempting to set access for " . join (", ", sort keys %{ $ignored{$ig} }) . "\n"; } } # parse the main config file parse_conf_file($GL_CONF, 'master'); # parse any delegated fragments wrap_chdir($GL_ADMINDIR); for my $fragment_file (glob("conf/fragments/*.conf")) { # we already check (elsewhere) that a fragment called "foo" will not try # to specify access control for a repo whose name is not "foo" or is not # part of a group called "foo" created by master # meanwhile, I found a possible attack where the admin for group B creates # a "convenience" group of (a subset of) his users, and then the admin for # repo group A (alphabetically before B) adds himself to that same group # in his own fragment. # as a result, admin_A now has access to group B repos :( # so now we lock the groups hash to the value it had after parsing # "master", and localise any changes to it by this fragment so that they # don't propagate to the next fragment. Thus, each fragment now has only # those groups that are defined in "master" and itself local %groups = %groups; my $fragment = $fragment_file; $fragment =~ s/^conf\/fragments\/(.*).conf$/$1/; parse_conf_file($fragment_file, $fragment); } my $compiled_fh = wrap_open( ">", "$GL_CONF_COMPILED.new" ); my $data_version = $current_data_version; print $compiled_fh Data::Dumper->Dump([$data_version], [qw(*data_version)]); my $dumped_data = Data::Dumper->Dump([\%repos], [qw(*repos)]); $dumped_data .= Data::Dumper->Dump([\%repo_config], [qw(*repo_config)]) if %repo_config; # the dump uses single quotes, but we convert any strings containing $creator, # $readers, $writers, to double quoted strings. A wee bit sneaky, but not too # much... $dumped_data =~ s/'(?=[^']*\$(?:creator|readers|writers|gl_user))~?(.*?)'/"$1"/g; print $compiled_fh $dumped_data; print $compiled_fh Data::Dumper->Dump([\%groups], [qw(*groups)]) if $GL_BIG_CONFIG and %groups; close $compiled_fh or die "$ABRT close compiled-conf failed: $!\n"; rename "$GL_CONF_COMPILED.new", "$GL_CONF_COMPILED"; # ---------------------------------------------------------------------------- # (that ends the config file compiler and write) # ---------------------------------------------------------------------------- # ---------------------------------------------------------------------------- # what's the git version? # ---------------------------------------------------------------------------- # we don't like stuff older than 1.6.2 my $git_version = `git --version`; die " *** ERROR *** did not get a proper version number. Please see if git is in the PATH on the server. If it is not, please edit ~/.gitolite.rc on the server and set the \$GIT_PATH variable to the correct value\n " unless $git_version; my ($gv_maj, $gv_min, $gv_patchrel) = ($git_version =~ m/git version (\d+)\.(\d+)\.(\d+)/); die "$ABRT I can't understand $git_version\n" unless ($gv_maj >= 1); $git_version = $gv_maj*10000 + $gv_min*100 + $gv_patchrel; # now it's "normalised" die "\n\t\t***** AAARGH! *****\n" . "\tyour git version is older than 1.6.2\n" . "\tsince that is now more than one year old, and gitolite needs some of\n" . "\tthe newer features, please upgrade.\n" if $git_version < 10602; # that's 1.6.2 to you # ---------------------------------------------------------------------------- # the rest of this program can be "switched off"; see doc/big-config.mkd for # details. # ---------------------------------------------------------------------------- # ---------------------------------------------------------------------------- # any new repos to be created? # ---------------------------------------------------------------------------- # repo-base needs to be an absolute path for this loop to work right # so if it was not already absolute, prefix $HOME. $ENV{GL_REPO_BASE_ABS} = ( $REPO_BASE =~ m(^/) ? $REPO_BASE : "$ENV{HOME}/$REPO_BASE" ); unless ($GL_NO_CREATE_REPOS) { wrap_chdir("$ENV{GL_REPO_BASE_ABS}"); # autocreate repos. Start with the ones that are normal repos in %repos my @repos = grep { $_ =~ $REPONAME_PATT and not /^@/ } sort keys %repos; # then, for each repogroup, find the members of the group and add them in map { push @repos, keys %{ $groups{$_} } } grep { /^@/ } keys %repos; # weed out duplicates (the code in the loop below is disk activity!) my %seen = map { $_ => 1 } @repos; @repos = sort keys %seen; for my $repo (sort @repos) { next unless $repo =~ $REPONAME_PATT; next if $repo =~ m(^\@|EXTCMD/); # these are not real repos unless (-d "$repo.git") { print STDERR "creating $repo...\n"; new_repo($repo, "$GL_ADMINDIR/hooks/common"); # new_repo would have chdir'd us away; come back wrap_chdir("$ENV{GL_REPO_BASE_ABS}"); } # when repos are copied over from elsewhere, one had to run easy install # once again to make the new (OS-copied) repo contain the proper update # hook. Perhaps we can make this easier now, and eliminate the easy # install, with a quick check (and a new, empty, "hook" as a sentinel) unless (-l "$repo.git/hooks/gitolite-hooked") { ln_sf("$GL_ADMINDIR/hooks/common", "*", "$repo.git/hooks"); # in case of package install, GL_ADMINDIR is no longer the top cop; # override with the package hooks ln_sf("$GL_PACKAGE_HOOKS/common", "*", "$repo.git/hooks") if $GL_PACKAGE_HOOKS; } } } # ---------------------------------------------------------------------------- # collect repo_patt for each actual repo # ---------------------------------------------------------------------------- # go through each actual repo on disk, and match it to either its own name in # the config (non-wild) or a wild pattern that matches it. Lots of things # later will need this correspondence so we may as well snarf it in one shot my %repo_patts = (); %repo_patts = &collect_repo_patts(\%repos) unless $GL_NO_DAEMON_NO_GITWEB; # NOTE: we're overloading GL_NO_DAEMON_NO_GITWEB to mean "no git config" also. # In fact anything that requires trawling through the existing repos doing # stuff to all of them is skipped if this variable is set. This is primarily # for the Fedora folks, but it should be useful for anyone who has a huge set # of repos and wants to manage gitweb/daemon/etc access via other means (they # typically have the whole thing controlled by a web-app and a database # anyway, and gitolite is only doing the access control and nothing more). # ---------------------------------------------------------------------------- # various updates to all real repos # ---------------------------------------------------------------------------- # ---------------------------------------------------------------------------- # update repo configurations, gitweb description, daemon export-ok, etc # ---------------------------------------------------------------------------- # all these require a "chdir" to the repo, so we club them for efficiency my %projlist = (); # for each real repo (and remember this will be empty, thus skipping all this, # if $GL_NO_DAEMON_NO_GITWEB is on!) for my $repo (keys %repo_patts) { my $repo_patt = $repo_patts{$repo}; # if non-wild, $repo_patt will be eq $repo anyway wrap_chdir("$ENV{GL_REPO_BASE_ABS}/$repo.git"); # git config if ($repo_patt eq $repo or $GL_GITCONFIG_WILD) { # erm, what that means is that it's either a non-wild repo being # config'd or a wild one but gitconfig is allowed on wilds. # XXX do we really need GL_GITCONFIG_WILD now? It was meant to be # only an efficiency thing, but that was before this whole revamp; # we already trawl through $REPO_BASE exactly once now anyway! # ...need to think about this &setup_repo_configs($repo, $repo_patt, \%repo_config) if $repo_config{$repo_patt}; } # daemon is easy &setup_daemon_access($repo, $repos{$repo_patt}{'R'}{'daemon'} || ''); # gitweb is a little more complicated. Here're some notes: # - "setup_gitweb_access" also sets "owner", despite the name # - specifying a description also counts as enabling gitweb # - description and owner are not specified for wildrepos; they're # specified for *actual* repos, even if the repo was created by a # wild card spec and "C" permissions. If you see the # conf/example.conf file, you will see that repo owner/desc don't go # into the "repo foo" section; they're essentialy independent. # Anyway, I believe it doesn't make sense to have all wild repos # (for some pattern) to have the same description and owner. if ($repos{$repo_patt}{'R'}{'gitweb'} or $desc{"$repo.git"}) { $projlist{"$repo.git"} = 1; &setup_gitweb_access($repo, 1, $desc{"$repo.git"} || '', $owner{"$repo.git"} || ''); } else { &setup_gitweb_access($repo, 0, '', ''); } } # write out the project list my $projlist_fh = wrap_open( ">", $PROJECTS_LIST); for my $proj (sort keys %projlist) { print $projlist_fh "$proj\n"; } close $projlist_fh; # ---------------------------------------------------------------------------- # "compile" ssh authorized_keys # ---------------------------------------------------------------------------- unless ($GL_NO_SETUP_AUTHKEYS) { &setup_authkeys($bindir, $GL_KEYDIR, \%user_list); }