source: trunk/server/doc/install-howto.sh @ 2090

Last change on this file since 2090 was 2080, checked in by ezyang, 13 years ago
Information on how to reenable password SSH.
File size: 16.8 KB
RevLine 
[1058]1# This document is a how-to for installing a Fedora scripts.mit.edu server.
[1693]2# It is semi-vaguely in the form of a shell script, but is not really
3# runnable as it stands.
[181]4
[1961]5# Notation
6# [PRODUCTION] Production server that will be put into the pool
7# [WIZARD]     Semi-production server that will only have
8#              daemon.scripts-security-upd bits, among other
9#              restricted permissions
10# [TESTSERVER] Completely untrusted server
11
[1693]12# 'branch' is the current svn branch you are on.  You want to
13# use trunk if you're just installing a new server, and branches/fcXX-dev
14# if you're preparing a server on a new Fedora release.
15branch="trunk"
[1063]16
[1693]17# 'server' is the public hostname of your server, for SCP'ing files
18# to and from.
19server=YOUR-SERVER-NAME-HERE
[1063]20
[2066]21# ----------------------------->8--------------------------------------
22#                       FIRST TIME INSTRUCTIONS
23#
[1961]24# [PRODUCTION] If this is the first time you've installed this hostname,
25# you will need to update a bunch of files to add support for it. These
26# include:
[1696]27#   o Adding all aliases to /etc/httpd/conf.d/scripts-vhost-names.conf
28#     (usually this is hostname, hostname.mit.edu, h-n, h-n.mit.edu,
29#     scriptsN, scriptsN.mit.edu, and the IP address.)
30#   o Adding routing rules for the static IP in
31#     /etc/sysconfig/network-scripts/route-eth1
32#   o Adding the IP address to the hosts file (same hosts as for
33#     scripts-vhost-names)
[1704]34#   o Update SSH config at
35#       - server/fedora/config/etc/ssh/shosts.equiv
36#       - server/fedora/config/etc/ssh/ssh_known_hosts
37#       - server/fedora/config/etc/ssh/sshd_config : DenyUsers
38#     (the last part is critical to ensure that rooting one server
39#     doesn't give you root to all the other servers)
[1696]40#   o Put the hostname information in LDAP so SVN and Git work
41#   o Set up Nagios monitoring on sipb-noc for the host
42#   o Set up the host as in the pool on r-b/r-b /etc/heartbeat/ldirectord.cf
[2066]43#   o Update locker/etc/known_hosts
[2068]44#   o Update website files:
45#       /mit/scripts/web_scripts/home/server.css.cgi
46#       /mit/scripts/web_scripts/heartbeat/heartbeat.php
[2066]47#
48# You will also need to prepare the keytabs for credit-card.  In particular,
49# use ktutil to combine the host/scripts.mit.edu and
50# host/scripts-vhosts.mit.edu keys with host/this-server.mit.edu in
51# the keytab.  Do not use 'k5srvutil change' on the combined keytab
52# or you'll break the other servers. (real servers only).  Be
53# careful about writing out the keytab: if you write it to an
54# existing file the keys will just get appended.  The correct
55# credential list should look like:
56#   ktutil:  l
57#   slot KVNO Principal
58#   ---- ---- ---------------------------------------------------------------------
59#      1    5 host/old-faithful.mit.edu@ATHENA.MIT.EDU
60#      2    3 host/scripts-vhosts.mit.edu@ATHENA.MIT.EDU
[2068]61#      3    2 host/scripts.mit.edu@ATHENA.MIT.EDU
62#      4    8 host/scripts-test.mit.edu@ATHENA.MIT.EDU
[2066]63#
64# The LDAP keytab should be by itself, so be sure to delete it and
65# put it in its own file.
[1696]66
[2066]67# ----------------------------->8--------------------------------------
68#                      INFINITE INSTALLATION
[1259]69
[2066]70# Start with a Scripts kickstarted install of Fedora (install-fedora)
[1259]71
[2079]72# IMPORTANT: If you are installing a server without the benefit of
73# Kickstart (for example, you are installing on XVM), it is VITALLY
74# IMPORTANT that you go through the kickstart and apply all of the
75# necessary changes--for example, disabling selinux or enabling
76# network.
77#   XXX We should make Kickstart work for test servers too
78
[2066]79# Take updates, reboot if there's a kernel update.
80    yum update -y
81
82# Get rid of network manager (XXX figure out how to make Kickstart do
83# this for us)
84    yum remove NetworkManager
85
86# Make sure sendmail isn't installed
87    yum remove sendmail
88
89# Check out the scripts /etc configuration
90    cd /root
91    \cp -a etc /
92    chmod 0440 /etc/sudoers
93
[2080]94# [TESTSERVER] You'll need to fix some config now.  See bottom of document.
95
[2066]96# Make sure network is working.  Kickstart should have
[1693]97# configured eth0 and eth1 correctly; restart the network service
[2066]98# to add the new routes from etc in route-eth1.
99    systemctl restart network.service
100    # Check everything worked:
[1693]101    route
102    ifconfig
103    cat /etc/hosts
104    cat /etc/sysconfig/network-scripts/route-eth1
[1259]105
[1693]106# This is the point at which you should start updating scriptsified
107# packages for a new Fedora release.  Consult 'upgrade-tips' for more
108# information.
109    yum install -y scripts-base
110    # Some of these packages are naughty and clobber some of our files
111    cd /etc
[2066]112    svn revert resolv.conf hosts sysconfig/openafs nsswitch.conf
[2079]113    # Troubleshooting: if accountadm, tokensys and nscd fail to install
114    # you probably forgot to turn off selinux
[1259]115
[1058]116# Replace rsyslog with syslog-ng by doing:
[1259]117    rpm -e --nodeps rsyslog
[1693]118    yum install -y syslog-ng
[2066]119    systemctl enable syslog-ng.service
[861]120
[1058]121# Install the full list of RPMs that users expect to be on the
[1259]122# scripts.mit.edu servers.
123rpm -qa --queryformat "%{Name}.%{Arch}\n" | sort > packages.txt
124# arrange for packages.txt to be passed to the server, then run:
[1693]125# --skip-broken will (usually) prevent you from having to sit through
126# several minutes of dependency resolution until it decides that
127# it can't install /one/ package.
128    yum install -y --skip-broken $(cat packages.txt)
[1259]129
[1190]130# Check which packages are installed on your new server that are not
131# in the snapshot, and remove ones that aren't needed for some reason
132# on the new machine.  Otherwise, aside from bloat, you may end up
133# with undesirable things for security, like sendmail.
[1693]134    rpm -qa --queryformat "%{Name}.%{Arch}\n" | grep -v kernel | sort > newpackages.txt
135    diff -u packages.txt newpackages.txt | grep -v kernel | less
[1382]136    # here's a cute script that removes all extra packages
[1693]137    yum erase -y $(grep -Fxvf packages.txt newpackages.txt)
[1961]138    # 20101208 - Mysteriously we manage to get these extra packages
139    # from kickstart: mcelog mobile-broadband-provider-info
140    # ModemManager PackageKit
[1190]141
[1693]142# We need an upstream version of cgi which we've packaged ourselves, but
143# it doesn't work with the haskell-platform package which expects
144# explicit versions.  So temporarily rpm -e the package, and then
145# install it again after you install haskell-platform.  [Note: You
[2066]146# probably won't need this in Fedora 17 or something, when the Haskell
[2079]147# Platform gets updated.] [It's not obvious to me that this actually
148# works]
[1693]149    rpm -e ghc-cgi-devel ghc-cgi
150    yum install -y haskell-platform
151    yumdownloader ghc-cgi
152    yumdownloader ghc-cgi-devel
[2068]153    rpm -i ghc-cgi*1.8.2*.rpm
[1693]154
[2066]155# ----------------------------->8--------------------------------------
156#                      SPHEROID SHENANIGANS
[1237]157
[2066]158# Note: Since ultimately we'd like to move away from using per-language
159# package managers and have all of these be RPMs, it is questionable
160# how much /good/ automation for these is necessary.
161
162# Warning: For a new release, we're supposed to check if Fedora has
163# packaged up the RPM.  Unfortunately we don't really have good incants
164# for this.
165
[1058]166# Install the full list of perl modules that users expect to be on the
[1108]167# scripts.mit.edu servers.
[1693]168    cd /root
[1259]169    export PERL_MM_USE_DEFAULT=1
[1693]170    cpan # this is interactive, enter the next two lines
[1259]171        o conf prerequisites_policy follow
172        o conf commit
173# on a reference server
174perldoc -u perllocal | grep head2 | cut -f 3 -d '<' | cut -f 1 -d '|' | sort -u | perl -ne 'chomp; print "notest install $_\n" if system("rpm -q --whatprovides \"perl($_)\" >/dev/null 2>/dev/null")' > perl-packages.txt
175# arrange for perl-packages.txt to be transferred to server
176    cat perl-packages.txt | perl -MCPAN -e shell
[812]177
[1058]178# Install the Python eggs and Ruby gems and PEAR/PECL doohickeys that are on
179# the other scripts.mit.edu servers and do not have RPMs.
[1259]180# The general mode of operation will be to run the "list" command
181# on both servers, see what the differences are, check if those diffs
182# are packaged up as rpms, and install them (rpm if possible, native otherwise)
[1178]183# - Look at /usr/lib/python2.7/site-packages and
184#           /usr/lib64/python2.7/site-packages for Python eggs and modules.
[1259]185#   There will be a lot of gunk that was installed from packages;
[1693]186#   easy-install.pth in /usr/lib/ will tell you what was easy_installed.
[1178]187#   First use 'yum search' to see if the relevant package is now available
188#   as an RPM, and install that if it is.  If not, then use easy_install.
[1432]189#   Pass -Z to easy_install to install them unzipped, as some zipped eggs
190#   want to be able to write to ~/.python-eggs.  (Also makes sourcediving
191#   easier.)
[2066]192# 'easy_install AuthKit jsonlib2 pygit'
193cat /usr/lib/python2.7/site-packages/easy-install.pth | grep "^./" | cut -c3- | cut -f1 -d- > egg.txt
[1698]194    cat egg.txt | xargs easy_install -Z
[2066]195
[1058]196# - Look at `gem list` for Ruby gems.
[1178]197#   Again, use 'yum search' and prefer RPMs, but failing that, 'gem install'.
[1259]198#       ezyang: rspec-rails depends on rspec, and will override the Yum
199#       package, so... don't use that RPM yet
[2066]200# XXX This doesn't do the right thing for old version gems
[1693]201gem list --no-version > gem.txt
202    gem install $(gem list --no-version | grep -Fxvf - gem.txt)
[2066]203    # Also, we need to install the old rails version
204    gem install -v=2.3.5 rails
205
[1058]206# - Look at `pear list` for Pear fruits (or whatever they're called).
[1178]207#   Yet again, 'yum search' for RPMs before resorting to 'pear install'.  Note
208#   that for things in the beta repo, you'll need 'pear install package-beta'.
[1259]209#   (you might get complaints about the php_scripts module; ignore them)
[1693]210pear list | tail -n +4 | cut -f 1 -d " " > pear.txt
211    pear config-set preferred_state beta
212    pear channel-update pear.php.net
213    pear install $(pear list | tail -n +4 | cut -f 1 -d " " | grep -Fxvf - pear.txt)
[2066]214
[1190]215# - Look at `pecl list` for PECL things.  'yum search', and if you must,
[1462]216#   'pecl install' needed items. If it doesn't work, try 'pear install
[1544]217#   pecl/foo' or 'pecl install foo-beta' or those two combined.
[1693]218pecl list | tail -n +4 | cut -f 1 -d " " > pecl.txt
219    pecl install --nodeps $(pecl list | tail -n +4 | cut -f 1 -d " " | grep -Fxvf - pecl.txt)
[785]220
[2066]221# ----------------------------->8--------------------------------------
222#                       INFINITE CONFIGURATION
[812]223
[2066]224# Create fedora-ds user (needed for credit-card)
225useradd -u 103 -r -d /var/lib/dirsrv fedora-ds
[387]226
[2066]227# Run credit-card to clone in credentials and make things runnable
228python host.py push $server
[1961]229
[2066]230# This is superseded by credit-card, but only for [PRODUCTION]
231# Don't use credit-card on [WIZARD]: it will put in the wrong creds!
232#
233#   # All types of servers will have an /etc/daemon.keytab file, however,
234#   # different types of server will have different credentials in this
235#   # keytab.
236#   #   [PRODUCTION] daemon.scripts
237#   #   [WIZARD]     daemon.scripts-security-upd
238#   #   [TESTSERVER] daemon.scripts-test
[1693]239
[2066]240# [PRODUCTION/WIZARD] Fix the openafs /usr/vice/etc <-> /etc/openafs
241# mapping.
242    echo "/afs:/usr/vice/cache:10000000" > /usr/vice/etc/cacheinfo
243    echo "athena.mit.edu" > /usr/vice/etc/ThisCell
244# [TESTSERVER] If you're installing a test server, this needs to be
245# much smaller; the max filesize on XVM is 10GB.  Pick something like
246# 500000. Also, some of the AFS parameters are poorly chosen (and if
247# you're low on disk space, will actually exhaust our inodes).  Edit
[2068]248# these parameters in /etc/sysconfig/openafs (This doesn't work in the
249# new systemd world order: try editing the unit file instead.)
[2066]250    echo "/afs:/usr/vice/cache:500000" > /usr/vice/etc/cacheinfo
251    vim /etc/sysconfig/openafs
[562]252
[2066]253# Test that zephyr is working
254    systemctl enable zhm.service
255    systemctl start zhm.service
256    echo 'Test!' | zwrite -d -c scripts -i test
[1259]257
[2066]258# Check out the scripts /usr/vice/etc configuration
259    cd /root/vice
260    \cp -a etc /usr/vice
261
[1961]262# [PRODUCTION] Set up replication (see ./install-ldap).
[1693]263# You'll need the LDAP keytab for this server: be sure to chown it
264# to fedora-ds after you create the fedora-ds user
265    ls -l /etc/dirsrv/keytab
266    cat install-ldap
[785]267
[2066]268# Enable lots of services
269    systemctl enable openafs-client.service
270    systemctl enable dirsrv.service
271    systemctl enable nslcd.service
272    systemctl enable nscd.service
273    systemctl enable postfix.service
274    systemctl enable nrpe.service
275    systemctl enable httpd.service # not for [WIZARD]
[1961]276
[2066]277    systemctl start openafs-client.service
278    systemctl start dirsrv.service
279    systemctl start nslcd.service
280    systemctl start nscd.service
281    systemctl start postfix.service
282    systemctl start nrpe.service
283    systemctl start httpd.service # not for [WIZARD]
[1961]284
[2066]285# Note about OpenAFS: Check that fs sysname is correct.  You should see,
286# among others, 'amd64_fedoraX_scripts' (vary X) and 'scripts'. If it's
287# not, you probably did a distro upgrade and should update
288# /etc/sysconfig/openafs (XXX this is wrong: figuring out new
289# systemd world order).
290    fs sysname
[818]291
[1259]292# Postfix doesn't actually deliver mail; fix this
293    cd /etc/postfix
294    postmap virtual
[1178]295
[1451]296# Munin might not be monitoring packages that were installed after it
297    munin-node-configure --suggest --shell | sh
298
[1058]299# Run fmtutil-sys --all, which does something that makes TeX work.
[1693]300# (Note: this errors on XeTeX which is ok.)
[1259]301    fmtutil-sys --all
[803]302
[1058]303# Ensure that PHP isn't broken:
[1259]304    mkdir /tmp/sessions
305    chmod 01777 /tmp/sessions
[1699]306    # XXX: this seems to get deleted if tmp gets cleaned up, so we
307    # might need something a little better (maybe init script.)
[954]308
[1259]309# Fix etc by making sure none of our config files got overwritten
310    cd /etc
[1693]311    svn status -q
[2066]312    # Some usual candidates for clobbering include nsswitch.conf,
313    # resolv.conf and sysconfig/openafs
[1961]314    # [WIZARD/TESTSERVER] Remember that changes you made should not get
315    # reverted!
[1259]316
[1058]317# Reboot the machine to restore a consistent state, in case you
[1693]318# changed anything. (Note: Starting kdump fails (this is ok))
[875]319
[2066]320# ------------------------------->8-------------------------------
321#                ADDENDA AND MISCELLANEOUS THINGS
322
[1693]323# [OPTIONAL] Your machine's hostname is baked in at install time;
324# in the rare case you need to change it, it appears to be in:
[1259]325#   o /etc/sysconfig/network
326#   o your lvm thingies; probably don't need to edit
[1382]327
[2080]328# [TESTSERVER] Enable password login
329        vim /etc/ssh/sshd_config
330        service sshd reload
331        vim /etc/pam.d/sshd
332# Replace the first auth block with:
333#           # If they're not root, but their user exists (success),
334#           auth    [success=ignore ignore=ignore default=1]        pam_succeed_if.so uid > 0
335#           # print the "You don't have tickets" error:
336#           auth    [success=die ignore=reset default=die]  pam_echo.so file=/etc/issue.net.no_tkt
337#           # If !(they are root),
338#           auth    [success=1 ignore=ignore default=ignore]        pam_succeed_if.so uid eq 0
339#           # print the "your account doesn't exist" error:
340#           auth    [success=die ignore=reset default=die]  pam_echo.so file=/etc/issue.net.no_user
341
342
[2066]343# [WIZARD/TESTSERVER] If you are setting up a non-production server,
344# there are some services that it won't provide, and you will need to
345# make it talk to a real server instead.  In particular:
346#   - We don't serve the web, so don't bind scripts.mit.edu
347#   - We don't serve LDAP, so use another server
348# This involves editing the following files:
[2080]349        \rm /etc/sysconfig/network-scripts/ifcfg-lo:{0,1,2,3}
350        \rm /etc/sysconfig/network-scripts/route-eth1 # [TESTSERVER] only
[2079]351#   o /etc/nslcd.conf
[2066]352#       replace: uri ldapi://%2fvar%2frun%2fdirsrv%2fslapd-scripts.socket/
353#       with: uri ldap://scripts.mit.edu/
[2079]354#           (what happened to nss-ldapd?)
[2066]355#   o /etc/openldap/ldap.conf
356#       add: URI ldap://scripts.mit.edu/
357#            BASE dc=scripts,dc=mit,dc=edu
358#   o /etc/httpd/conf.d/vhost_ldap.conf
359#       replace: VhostLDAPUrl "ldap://127.0.0.1/ou=VirtualHosts,dc=scripts,dc=mit,dc=edu"
360#       with: VhostLDAPUrl "ldap://scripts.mit.edu/ou=VirtualHosts,dc=scripts,dc=mit,dc=edu"
361#   o /etc/postfix/virtual-alias-{domains,maps}-ldap.cf
362#       replace: server_host ldapi://%2fvar%2frun%2fdirsrv%2fslapd-scripts.socket/
363#       with: server_host = ldap://scripts.mit.edu
364# to use scripts.mit.edu instead of localhost.
365# XXX: someone should write sed scripts to do this
366
367# [WIZARD/TESTSERVER] If you are setting up a non-production server,
368# afsagent's cronjob will attempt to renew with the wrong
369# credentials (daemon.scripts). Change this:
370    vim /home/afsagent/renew # replace all mentions of daemon.scripts.mit.edu
371
[1961]372# [TESTSERVER]
373#   - You need a self-signed SSL cert or Apache will refuse to start
374#     or do SSL.  Generate with:
[1382]375    openssl req -new -x509 -keyout /etc/pki/tls/private/scripts.key -out /etc/pki/tls/certs/scripts.cert -nodes
[1961]376#     Also make /etc/pki/tls/certs/ca.pem match up (XXX what's the
377#     incant for that?)
378
379# [TESTSERVER] More stuff for test servers
[1382]380#   - Make (/etc/aliases) root mail go to /dev/null, so we don't spam people
381#   - Edit /etc/httpd/conf.d/scripts-vhost-names.conf to have scripts-fX-test.xvm.mit.edu
382#     be an accepted vhost name
383#   - Look at the old test server and see what config changes are floating around
Note: See TracBrowser for help on using the repository browser.