aboutsummaryrefslogtreecommitdiffstats
path: root/src/blogc-github-lambda/lambda_function.py
blob: 5a3bf5ef8836b727d27c08de3948f56bce6be606 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
# coding: utf-8
"""
  blogc: A blog compiler.
  Copyright (C) 2016 Rafael G. Martins <rafael@rafaelmartins.eng.br>

  This program can be distributed under the terms of the BSD License.
  See the file LICENSE.
"""

from contextlib import closing
from StringIO import StringIO

import base64
import boto3
import hashlib
import json
import mimetypes
import os
import subprocess
import sys
import tarfile
import urllib2
import shutil

# Absolute directory that contains this module; the blogc binary handed to
# make is looked up relative to it.
cwd = os.path.dirname(os.path.abspath(__file__))

# Credentials sent to the GitHub API as HTTP Basic auth. A value containing
# a colon is used as-is; any other value is treated as a base64-encoded KMS
# ciphertext and decrypted once, at import time.
GITHUB_AUTH = os.environ.get('GITHUB_AUTH')
if not (GITHUB_AUTH is None or ':' in GITHUB_AUTH):
    GITHUB_AUTH = boto3.client('kms').decrypt(
        CiphertextBlob=base64.b64decode(GITHUB_AUTH),
    )['Plaintext']


def get_tarball(repo_name, ref='master', dest='/tmp'):
    """Download a repository snapshot from GitHub and unpack it.

    The tarball is fetched through the GitHub API (authenticated with
    ``GITHUB_AUTH`` when that is set), held in memory, and extracted into
    ``dest``. A directory left over from a previous extraction of the same
    snapshot is removed first.

    :param repo_name: repository in ``owner/name`` form, as used in the
        GitHub API URL.
    :param ref: branch, tag or commit to download. Defaults to ``master``.
    :param dest: directory the archive is extracted into. Defaults to
        ``/tmp``.
    :returns: path of the archive's top-level entry below ``dest``.
    :raises RuntimeError: if the archive contains no top-level entry.
    """
    tarball_url = 'https://api.github.com/repos/%s/tarball/%s' % (repo_name,
                                                                  ref)
    request = urllib2.Request(tarball_url)

    if GITHUB_AUTH is not None:
        auth = base64.b64encode(GITHUB_AUTH)
        request.add_header("Authorization", "Basic %s" % auth)

    with closing(urllib2.urlopen(request)) as fp:
        tarball = fp.read()

    with closing(StringIO(tarball)) as fp:
        with tarfile.open(fileobj=fp, mode='r:gz') as tar:
            # The first member name without a slash is taken as the
            # top-level entry that wraps the whole snapshot.
            rootname = next(
                (name for name in tar.getnames() if '/' not in name), None)
            if rootname is None:
                raise RuntimeError('Failed to find a directory in tarball')
            rootdir = os.path.join(dest, rootname)

            # Start from a clean tree so files deleted upstream do not
            # survive from an earlier run.
            if os.path.isdir(rootdir):
                shutil.rmtree(rootdir)

            # NOTE(review): extractall() trusts the member paths stored in
            # the archive. That is acceptable only as long as the archive
            # comes straight from the GitHub API.
            tar.extractall(dest)

    return rootdir


def translate_filename(filename):
    """Map a local file path to the key it should be stored under in S3.

    Any ``index.$EXT`` file (exactly one dot in its basename) is renamed to
    ``index.html``, because S3 only allows users to declare one directory
    index file name. Every other path is returned unchanged.

    :param filename: '/'-separated path.
    :returns: the path with its basename replaced by ``index.html`` when
        the rule above applies, otherwise ``filename`` itself.
    """
    # rpartition keeps the directory part and the separator, so the result
    # can be rebuilt without splitting the whole path.
    dirname, sep, basename = filename.rpartition('/')

    parts = basename.split('.')
    if len(parts) == 2 and parts[0] == 'index':
        return dirname + sep + 'index.html'

    return filename


def sync_s3(src, dest, settings_file):
    s3 = boto3.resource('s3')
    bucket = s3.Bucket(dest)

    remote_files = {}
    for obj in bucket.objects.all():
        if not obj.key.endswith('/'):
            remote_files[obj.key] = obj

    local_files = {}
    for root, dirs, files in os.walk(src):
        real_root = root[len(src):].lstrip('/')
        for file in files:
            f = os.path.join(real_root, file)
            local_files[translate_filename(f)] = f

    to_upload = []
    for file in local_files:
        if file not in remote_files:
            to_upload.append(local_files[file])

    to_delete = []
    for file in remote_files:
        if file in local_files:
            with open(os.path.join(src, local_files[file])) as fp:
                l = hashlib.sha1(fp.read())

            with closing(remote_files[file].get()['Body']) as fp:
                r = hashlib.sha1(fp.read())

            if l.hexdigest() != r.hexdigest():
                to_upload.append(local_files[file])
        else:
            to_delete.append(file)

    content_types = {}
    if os.path.exists(settings_file):
        with open(settings_file, 'r') as fp:
            settings = json.load(fp)
            content_types = settings.get('content-type', {})

    for file in to_upload:
        with open(os.path.join(src, file), 'rb') as fp:
            mime = content_types.get(file, mimetypes.guess_type(file)[0])
            file = translate_filename(file)
            print 'Uploading file: %s; content-type: "%s"' % (file, mime)
            if mime is not None:
                bucket.put_object(Key=file, Body=fp, ContentType=mime)
            else:
                bucket.put_object(Key=file, Body=fp)

    for file in to_delete:
        print 'Deleting file:', file
        remote_files[file].delete()


def lambda_handler(event, context):
    """AWS Lambda entry point: rebuild and publish a site after a push.

    The first SNS record of ``event`` must carry a JSON message with a
    ``ref`` and a ``repository`` entry (presumably a GitHub push payload).
    Pushes to anything but ``refs/heads/master`` are ignored. Otherwise the
    repository snapshot is downloaded, built with ``make`` into ``_build``
    and synced to the S3 bucket named after the repository.

    Output of ``make`` is discarded unless the ``DEBUG`` environment
    variable is set.

    :param event: Lambda event containing the SNS notification.
    :param context: Lambda context object (unused).
    :raises RuntimeError: if ``make`` exits with a non-zero status.
    """
    message = event['Records'][0]['Sns']['Message']
    payload = json.loads(message)

    if payload['ref'] != 'refs/heads/master':
        return

    debug = 'DEBUG' in os.environ

    repo_name = payload['repository']['name']
    repo_full_name = payload['repository']['full_name']
    rootdir = get_tarball(repo_full_name)

    command = ['make', '-C', rootdir, 'OUTPUT_DIR=_build',
               'BLOGC=%s' % os.path.join(cwd, 'blogc')]
    if debug:
        # Inherit stdout/stderr so the build output reaches the Lambda logs.
        rv = subprocess.call(command)
    else:
        # subprocess.call() never reads from a PIPE, so a verbose build
        # could fill the pipe buffer and block forever. Discard the output
        # through os.devnull instead.
        with open(os.devnull, 'w') as devnull:
            rv = subprocess.call(command, stdout=devnull, stderr=devnull)
    if rv != 0:
        raise RuntimeError('Failed to run make')

    sync_s3(os.path.join(rootdir, '_build'), repo_name,
            os.path.join(rootdir, 's3.json'))