summaryrefslogtreecommitdiff
path: root/lib/spack/spack/package.py
blob: 0611d005dbfabba29514805adbf796210bb90e58 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
"""
This is where most of the action happens in Spack.
See the Package docs for detailed instructions on how the class works
and on how to write your own packages.

The spack package structure is based strongly on Homebrew
(http://wiki.github.com/mxcl/homebrew/), mainly because
Homebrew makes it very easy to create packages.  For a complete
rundown on spack and how it differs from homebrew, look at the
README.
"""
import inspect
import multiprocessing
import os
import platform as py_platform
import re
import shutil
import subprocess

from spack import *
import spack.spec
import packages
import tty
import attr
import validate
import url


from spec import Compiler
from version import *
from multi_function import platform
from stage import Stage


class Package(object):
    """This is the superclass for all spack packages.

    The Package class
    ==================
    Package is where the bulk of the work of installing packages is done.

    A package defines how to fetch, verify (via, e.g., md5), build, and
    install a piece of software.  A Package also defines what other
    packages it depends on, so that dependencies can be installed along
    with the package itself.  Packages are written in pure python.

    Packages are all submodules of spack.packages.  If spack is installed
    in $prefix, all of its python files are in $prefix/lib/spack.  Most
    of them are in the spack module, so all the packages live in
    $prefix/lib/spack/spack/packages.

    All you have to do to create a package is make a new subclass of Package
    in this directory.  Spack automatically scans the python files there
    and figures out which one to import when you invoke it.

    An example package
    ====================
    Let's look at the cmake package to start with.  This package lives in
    $prefix/lib/spack/spack/packages/cmake.py:

    from spack import *
    class Cmake(Package):
        homepage  = 'https://www.cmake.org'
        url       = 'http://www.cmake.org/files/v2.8/cmake-2.8.10.2.tar.gz'
        md5       = '097278785da7182ec0aea8769d06860c'

        def install(self, prefix):
            configure('--prefix=%s'   % prefix,
                      '--parallel=%s' % make_jobs)
            make()
            make('install')

    Naming conventions
    ---------------------
    There are two names you should care about:

    1. The module name, 'cmake'.
       - Users will refer to this name, e.g. 'spack install cmake'.
       - Corresponds to the name of the file, 'cmake.py', and it can
         include _, -, and numbers (it can even start with a number).

    2. The class name, "Cmake".  This is formed by converting -'s or _'s
       in the module name to camel case.  If the name starts with a number,
       we prefix the class name with 'Num_'. Examples:

         Module Name       Class Name
          foo_bar           FooBar
          docbook-xml       DocbookXml
          FooBar            Foobar
          3proxy            Num_3proxy

        The class name is what spack looks for when it loads a package module.

    Required Attributes
    ---------------------
    Aside from proper naming, here is the bare minimum set of things you
    need when you make a package:
        homepage   informational URL, so that users know what they're
                   installing.

        url        URL of the source archive that spack will fetch.

        md5        md5 hash of the source archive, so that we can
                   verify that it was downloaded securely and correctly.

        install()  This function tells spack how to build and install the
                   software it downloaded.

    Optional Attributes
    ---------------------
    You can also optionally add these attributes, if needed:
        list_url
            Webpage to scrape for available version strings. Default is the
            directory containing the tarball; use this if the default isn't
            correct so that invoking 'spack versions' will work for this
            package.

        url_version(self, version)
            When spack downloads packages at particular versions, it just
            converts version to string with str(version).  Override this if
            your package needs special version formatting in its URL.  boost
            is an example of a package that needs this.

    Creating Packages
    ===================
    As a package creator, you can probably ignore most of the preceding
    information, because you can use the 'spack create' command to do it
    all automatically.

    You as the package creator generally only have to worry about writing
    your install function and specifying dependencies.

    spack create
    ----------------
    Most software comes in nicely packaged tarballs, like this one:
        http://www.cmake.org/files/v2.8/cmake-2.8.10.2.tar.gz

    Taking a page from homebrew, spack deduces pretty much everything it
    needs to know from the URL above.  If you simply type this:

        spack create http://www.cmake.org/files/v2.8/cmake-2.8.10.2.tar.gz

    Spack will download the tarball, generate an md5 hash, figure out the
    version and the name of the package from the URL, and create a new
    package file for you with all the names and attributes set correctly.

    Once this skeleton code is generated, spack pops up the new package in
    your $EDITOR so that you can modify the parts that need changes.

    Dependencies
    ---------------
    If your package requires another in order to build, you can specify that
    like this:

    class Stackwalker(Package):
        ...
        depends_on("libdwarf")
        ...

    This tells spack that before it builds stackwalker, it needs to build
    the libdwarf package as well.  Note that this is the module name, not
    the class name (The class name is really only used by spack to find
    your package).

    Spack will download and install each dependency before it installs your
    package.  In addition, it will add -L, -I, and rpath arguments to your
    compiler and linker for each dependency.  In most cases, this allows you
    to avoid specifying any dependencies in your configure or cmake line;
    you can just run configure or cmake without any additional arguments and
    it will find the dependencies automatically.


    The Install Function
    ----------------------
    The install function is designed so that someone not too terribly familiar
    with Python could write a package installer.  For example, we put a number
    of commands in install scope that you can use almost like shell commands.
    These include make, configure, cmake, rm, rmtree, mkdir, mkdirp, and others.

    You can see above in the cmake script that these commands are used to run
    configure and make almost like they're used on the command line.  The
    only difference is that they are python function calls and not shell
    commands.

    It may be puzzling to you where the commands and functions in install live.
    They are NOT instance variables on the class; this would require us to
    type 'self.' all the time and it makes the install code unnecessarily long.
    Rather, spack puts these commands and variables in *module* scope for your
    Package subclass.  Since each package has its own module, this doesn't
    pollute other namespaces, and it allows you to more easily implement an
    install function.

    For a full list of commands and variables available in module scope, see the
    add_commands_to_module() function in this class. This is where most of
    them are created and set on the module.


    Parallel Builds
    -------------------
    By default, Spack will run make in parallel when you run make() in your
    install function.  Spack figures out how many cores are available on
    your system and runs make with -j<cores>.  If you do not want this behavior,
    you can explicitly mark a package not to use parallel make:

    class SomePackage(Package):
        ...
        parallel = False
        ...

    This changes the default behavior so that make is sequential.  If you still
    want to build some parts in parallel, you can do this in your install function:

        make(parallel=True)

    Likewise, if you do not supply parallel = False in your Package, you can keep
    the default parallel behavior and run make like this when you want a
    sequential build:

        make(parallel=False)

    Package Lifecycle
    ==================
    This section is really only for developers of new spack commands.

    A package's lifecycle over a run of Spack looks something like this:

        p = Package()             # Done for you by spack

        p.do_fetch()              # called by spack commands in spack/cmd.
        p.do_stage()              # see spack.stage.Stage docs.
        p.do_install()            # calls package's install() function
        p.do_uninstall()

    There are also some other commands that clean the build area:
        p.do_clean()              # runs make clean
        p.do_clean_work()         # removes the build directory and
                                  # re-expands the archive.
        p.do_clean_dist()         # removes the stage directory entirely

    The convention used here is that a do_* function is intended to be called
    internally by Spack commands (in spack.cmd).  These aren't for package
    writers to override, and doing so may break the functionality of the Package
    class.

    Package creators override functions like install() (all of them do this),
    clean() (some of them do this), and others to provide custom behavior.
    """

    #
    # Per-package metadata.  Subclasses are expected to define or override
    # these.
    #
    # NOTE(review): this list is a class attribute, so it is shared by every
    # subclass that does not rebind it -- presumably depends_on() handles
    # that; confirm before mutating it in place.
    """By default a package has no dependencies."""
    dependencies = []

    #
    # Class-level defaults for settings that are read through `self`
    # (self.parallel, self.dirty, self.ignore_dependencies) in the methods
    # below.
    #
    """By default we build in parallel.  Subclasses can override this."""
    parallel = True

    # Checked by remove_prefix() and do_install() before deleting the install
    # prefix or destroying the stage.
    """Remove tarball and build by default.  If this is true, leave them."""
    dirty = False

    # Checked by do_install() and do_uninstall().
    """Controls whether install and uninstall check deps before running."""
    ignore_dependencies = False

    def __init__(self, spec):
        """Validate the package's metadata and set up its build state.

        spec is stored as self.spec; prefix() and do_install() read it to
        compute the install location and to check concreteness.

        Reports a fatal error through tty.die() if the homepage still
        contains example.com, or if no version attribute is set and none
        can be parsed out of the URL.
        """
        # These attributes are required for all packages.
        attr.required(self, 'homepage')
        attr.required(self, 'url')
        attr.required(self, 'md5')

        # this determines how the package should be built.
        self.spec = spec

        # Name of package is the name of its module (the file that contains it)
        self.name = inspect.getmodulename(self.module.__file__)

        # Don't allow the default homepage.  The dot is escaped so that only a
        # literal "example.com" is rejected.
        if re.search(r'example\.com', self.homepage):
            tty.die("Bad homepage in %s: %s" % (self.name, self.homepage))

        # Make sure URL is an allowed type
        validate.url(self.url)

        # Set up version
        if not hasattr(self, 'version'):
            try:
                self.version = url.parse_version(self.url)
            except UndetectableVersionError:
                # Adjacent literals are joined before '%' is applied.  With
                # '+', the '%' bound only to the second literal (which has no
                # placeholder) and raised TypeError instead of reporting.
                tty.die("Couldn't extract a default version from %s. You "
                        "must specify it explicitly in the package." % self.url)
        elif isinstance(self.version, str):
            # A version given as a plain string in the package file is
            # promoted to a Version object.  (The previous check compared the
            # type against the name `string`, which no import visible in this
            # file binds to a type.)
            self.version = Version(self.version)

        # Empty at first; only compute dependent packages if necessary
        self._dependents = None

        # This is set by scraping a web page.
        self._available_versions = None

        # stage used to build this package.
        self.stage = Stage("%s-%s" % (self.name, self.version), self.url)

        # Set a default list URL (place to find available versions)
        if not hasattr(self, 'list_url'):
            self.list_url = os.path.dirname(self.url)


    def add_commands_to_module(self):
        """Inject build helpers into the namespace of the package's module.

           install() implementations can then refer to names such as make,
           configure, prefix, bin or man1 as plain module globals.
        """
        mod = self.module

        # Build tools.  make_jobs is the number of jobs spack prefers to
        # build with.  configure is resolved relative to the current
        # directory on purpose (not looked up with which).
        mod.make      = MakeExecutable('make', self.parallel)
        mod.gmake     = MakeExecutable('gmake', self.parallel)
        mod.make_jobs = multiprocessing.cpu_count()
        mod.configure = Executable('./configure')
        mod.cmake     = which("cmake")

        # Standard CMake arguments; one extra flag when mac_ver() reports a
        # release string.
        cmake_args = ['-DCMAKE_INSTALL_PREFIX=%s' % self.prefix,
                      '-DCMAKE_BUILD_TYPE=None']
        if py_platform.mac_ver()[0]:
            cmake_args.append('-DCMAKE_FIND_FRAMEWORK=LAST')
        mod.std_cmake_args = cmake_args

        # Shell-like convenience commands.
        shell_like = (
            ('cd',         os.chdir),
            ('mkdir',      os.mkdir),
            ('makedirs',   os.makedirs),
            ('remove',     os.remove),
            ('removedirs', os.removedirs),
            ('mkdirp',     mkdirp),
            ('install',    install),
            ('rmtree',     shutil.rmtree),
            ('move',       shutil.move),
        )
        for command, function in shell_like:
            setattr(mod, command, function)

        # Useful directories within the prefix.
        mod.prefix = self.prefix
        for subdir in ('bin', 'sbin', 'etc', 'include',
                       'lib', 'lib64', 'libexec', 'share'):
            setattr(mod, subdir, new_path(self.prefix, subdir))

        # Directories below share/.
        for subdir in ('doc', 'info', 'man'):
            setattr(mod, subdir, new_path(mod.share, subdir))

        # man1 .. man8 below share/man.
        for section in range(1, 9):
            section_name = 'man%d' % section
            setattr(mod, section_name, new_path(mod.man, section_name))

    @property
    def dependents(self):
        """Tuple of names of the packages that depend on this one."""
        # Nothing cached yet: ask the packages module to compute dependents.
        # NOTE(review): presumably compute_dependents() fills in _dependents
        # on every package; confirm in packages.
        not_computed = self._dependents is None
        if not_computed:
            packages.compute_dependents()
        return tuple(self._dependents)


    def sanity_check(self):
        """Ensure that this package and its dependencies don't have conflicting
           requirements."""
        # NOTE(review): only the name-sorted dependency list is built here;
        # no conflict check is performed on it yet.
        deps = list(self.all_dependencies)
        deps.sort(key=lambda dep: dep.name)



    @property
    @memoized
    def all_dependencies(self):
        """Set of all transitive dependencies of this package."""
        # Start from a fresh copy of the direct dependencies, then fold in
        # the closure of each dependency's own package.
        closure = set(self.dependencies)
        for direct in self.dependencies:
            closure.update(packages.get(direct.name).all_dependencies)
        return closure


    @property
    def installed(self):
        """True if this package's install prefix exists on disk."""
        install_dir = self.prefix
        return os.path.exists(install_dir)


    @property
    def installed_dependents(self):
        """Tuple of names of installed packages that depend on this one,
           directly or through other installed dependents.  A name may
           appear more than once."""
        present = [name for name in self.dependents
                   if packages.get(name).installed]

        collected = []
        for name in present:
            # The dependent itself, followed by its own installed dependents.
            collected += [name]
            collected += packages.get(name).installed_dependents
        return tuple(collected)


    @property
    def all_dependents(self):
        """Tuple of names of every package that depends on this one, directly
           or transitively.  A name may appear more than once."""
        direct = self.dependents
        collected = list(direct)
        for name in direct:
            collected += packages.get(name).all_dependents
        return tuple(collected)


    @property
    def prefix(self):
        """Install location for this package, as computed by the install
           layout from self.spec."""
        layout = spack.install_layout
        return layout.path_for_spec(self.spec)


    def url_version(self, version):
        """Return the text to substitute into the package's URL in order to
           download the given version.

           The default is simply str(version).  Subclasses may override this
           when the URL spells versions differently, e.g. boost, where the
           download URL needs _'s.
        """
        version_text = str(version)
        return version_text


    def remove_prefix(self):
        """Ask the install layout to remove the path for this package's spec.
           Does nothing when self.dirty is set."""
        if not self.dirty:
            spack.install_layout.remove_path_for_spec(self.spec)


    def do_fetch(self):
        """Sets up the stage, downloads the tarball for this package, and
           checks the tarball's md5 against the package's md5 attribute.
           A mismatch is reported through tty.die().
        """
        self.stage.setup()
        self.stage.fetch()

        actual_md5 = md5(self.stage.archive_file)
        if actual_md5 == self.md5:
            return

        tty.die("MD5 Checksum failed for %s.  Expected %s but got %s."
                % (self.name, self.md5, actual_md5))


    def do_stage(self):
        """Fetches the tarball, expands it unless an expanded copy is already
           present in the stage, then changes into the expanded directory."""
        self.do_fetch()

        stage = self.stage
        if stage.expanded_archive_path:
            tty.msg("Already staged %s" % self.name)
        else:
            tty.msg("Staging archive: %s" % stage.archive_file)
            stage.expand_archive()

        stage.chdir_to_archive()


    def do_install(self):
        """Drive a complete install of this package.

           Spack commands call this; package implementations override
           install() instead.

           Steps: return early if the prefix already exists, install
           dependencies (unless ignore_dependencies is set), fetch and stage
           the source, set up the build environment, run install(), and
           finally destroy the stage unless the package is marked dirty.

           Raises ValueError if self.spec is not concrete.  Any exception
           raised by install() is re-raised after the prefix is cleaned up;
           a CalledProcessError is reported through tty.die() instead.
        """
        if not self.spec.concrete:
            raise ValueError("Can only install concrete packages.")

        if os.path.exists(self.prefix):
            tty.msg("%s is already installed." % self.name)
            tty.pkg(self.prefix)
            return

        if not self.ignore_dependencies:
            self.do_install_dependencies()

        self.do_stage()
        self.setup_install_environment()

        # Add convenience commands to the package's module scope to
        # make building easier.
        self.add_commands_to_module()

        tty.msg("Building %s." % self.name)
        try:
            self.install(self.prefix)
            if not os.path.isdir(self.prefix):
                tty.die("Install failed for %s.  No install dir created." % self.name)

        except subprocess.CalledProcessError as e:
            self.remove_prefix()
            # str(e) carries the failed command and exit status;
            # CalledProcessError does not populate the deprecated .message
            # attribute, so the detail used to be lost.
            tty.die("Install failed for %s" % self.name, str(e))

        except (KeyboardInterrupt, Exception):
            # KeyboardInterrupt is listed explicitly because it does not
            # derive from Exception.  remove_prefix() already leaves the
            # prefix alone when the package is dirty, so no extra check is
            # needed here.
            self.remove_prefix()
            raise

        tty.msg("Successfully installed %s" % self.name)
        tty.pkg(self.prefix)

        # Once the install is done, destroy the stage where we built it,
        # unless the user wants it kept around.
        if not self.dirty:
            self.stage.destroy()


    def setup_install_environment(self):
        """Prepare os.environ for a build: drop the library-path variables
           and export the SPACK_* variables set below."""
        pop_keys(os.environ, "LD_LIBRARY_PATH", "LD_RUN_PATH", "DYLD_LIBRARY_PATH")

        # Pass the lib location along so the compiler script can find spack.
        os.environ[SPACK_LIB] = lib_path

        # Fix for case-insensitive file systems.  Conflicting links are
        # in directories called "case*" within the env directory, so those
        # directories are searched in addition to env_path itself.
        candidates = [(entry, new_path(env_path, entry))
                      for entry in os.listdir(env_path)]
        env_paths = [env_path] + [
            candidate for entry, candidate in candidates
            if entry.startswith("case") and os.path.isdir(candidate)]

        # Spack environment goes at the front of PATH.
        path_put_first("PATH", env_paths)
        path_set(SPACK_ENV_PATH, env_paths)

        # Prefixes of the direct dependencies.
        dependency_prefixes = [dep.package.prefix for dep in self.dependencies]
        path_set(SPACK_DEPENDENCIES, dependency_prefixes)

        # Install location, and build root for logging.
        os.environ[SPACK_PREFIX] = self.prefix
        os.environ[SPACK_BUILD_ROOT] = self.stage.expanded_archive_path


    def do_install_dependencies(self):
        """Run do_install() on the package of each direct dependency, in the
           order they are listed in self.dependencies."""
        for dependency in self.dependencies:
            dependency_pkg = dependency.package
            dependency_pkg.do_install()


    @property
    def module(self):
        """The module object in which this package's class is defined.
           Names set on it become globals for the class's install() method.
        """
        cls = self.__class__
        # A non-empty fromlist makes __import__ return the named module
        # itself rather than its top-level parent package.
        return __import__(cls.__module__, fromlist=[cls.__name__])


    def install(self, prefix):
        """Build and install the software into prefix.  Every package must
           override this; the base implementation only reports an error."""
        complaint = "Packages must provide an install method!"
        tty.die(complaint)


    def do_uninstall(self):
        """Remove this package's install prefix.

           Reports an error through tty.die() if the prefix does not exist
           or, unless ignore_dependencies is set, if installed packages
           still depend on this one.
        """
        if not os.path.exists(self.prefix):
            tty.die(self.name + " is not installed.")

        # Dependents are only looked up when the dependency check is enabled.
        check_dependents = not self.ignore_dependencies
        blockers = self.installed_dependents if check_dependents else ()
        if blockers:
            tty.die(
                "Cannot uninstall %s. The following installed packages depend on it:"
                % self.name, " ".join(blockers))

        # NOTE(review): remove_prefix() does nothing when self.dirty is set,
        # yet success is still reported below -- confirm this is intended.
        self.remove_prefix()
        tty.msg("Successfully uninstalled %s." % self.name)


    def do_clean(self):
        """Run clean() from inside the expanded archive directory.  Does
           nothing if the stage has no expanded archive."""
        stage = self.stage
        if not stage.expanded_archive_path:
            return
        stage.chdir_to_archive()
        self.clean()


    def clean(self):
        """By default just runs make clean.  Override if this isn't good.

           A CalledProcessError from make is downgraded to a warning rather
           than propagated.
        """
        try:
            make = MakeExecutable('make', self.parallel)
            make('clean')
            tty.msg("Successfully cleaned %s" % self.name)
        except subprocess.CalledProcessError:
            # The exception object is not needed, so it is not bound.
            tty.warn("Warning: 'make clean' didn't work.  Consider 'spack clean --work'.")


    def do_clean_work(self):
        """Reset the build area by asking the stage to restage itself."""
        build_stage = self.stage
        build_stage.restage()


    def do_clean_dist(self):
        """Destroy the stage directory for this package if it exists, then
           report success."""
        build_stage = self.stage
        if os.path.exists(build_stage.path):
            build_stage.destroy()
        tty.msg("Successfully cleaned %s" % self.name)


    @property
    def available_versions(self):
        """Versions of this package found by scraping self.list_url.

           The result is cached on the instance after the first non-empty
           answer.  If fetching fails or nothing matches, a warning is
           printed and a list holding only self.version is returned.
        """
        if not self._available_versions:
            self._available_versions = VersionList()
            try:
                # Fetch the listing page quietly (-s), following redirects (-L).
                listing = spack.curl('-s', '-L', self.list_url, return_output=True)

                # Find everything in the page that looks like this package's
                # archive name with any version substituted in ...
                url_regex = os.path.basename(url.wildcard_version(self.url))
                strings = re.findall(url_regex, listing)

                # ... and pull the version out of each match.
                wildcard = self.version.wildcard()
                for s in strings:
                    match = re.search(wildcard, s)
                    if match:
                        self._available_versions.add(ver(match.group(0)))

            except subprocess.CalledProcessError:
                # Qualified with the subprocess module, like the other
                # handlers in this class; the bare name is not imported here.
                tty.warn("Fetching %s failed." % self.list_url,
                         "Package.available_versions requires an internet connection.",
                         "Version list may be incomplete.")

            if not self._available_versions:
                tty.warn("Found no versions for %s" % self.name,
                         "Package.available_versions may require adding the list_url attribute",
                         "to the package to tell Spack where to look for versions.")
                # NOTE(review): this fallback is a plain list, not a
                # VersionList like the scraped result; callers presumably
                # only iterate over it -- confirm.
                self._available_versions = [self.version]
        return self._available_versions


class MakeExecutable(Executable):
    """Special Executable for make so the user can specify parallel or
       not on a per-invocation basis.  Using 'parallel' as a kwarg will
       override whatever the package's global setting is, so you can
       either default to true or false and override particular calls.

       Note that if the SPACK_NO_PARALLEL_MAKE env var is set it overrides
       everything.
    """
    def __init__(self, name, parallel):
        """Wrap the executable called name; parallel is the default used when
           a call does not pass its own 'parallel' keyword."""
        super(MakeExecutable, self).__init__(name)
        self.parallel = parallel

    def __call__(self, *args, **kwargs):
        """Run the executable with args, prepending -j<cpu count> when a
           parallel build is requested and not disabled by the environment.

           Returns whatever Executable.__call__ returns, so keyword options
           handled by the parent class keep working here.
        """
        parallel = kwargs.get('parallel', self.parallel)
        disable_parallel = env_flag(SPACK_NO_PARALLEL_MAKE)

        if parallel and not disable_parallel:
            jobs = "-j%d" % multiprocessing.cpu_count()
            args = (jobs,) + args

        # Hand the parent's result back to the caller; it used to be dropped.
        return super(MakeExecutable, self).__call__(*args, **kwargs)