launchpad-reviewers team mailing list archive
-
launchpad-reviewers team
-
Mailing list archive
-
Message #25038
[Merge] ~pappacena/turnip:celery-repo-creation into turnip:master
Thiago F. Pappacena has proposed merging ~pappacena/turnip:celery-repo-creation into turnip:master with ~pappacena/turnip:async-repo-creation as a prerequisite.
Commit message:
Option on POST /repo API call to asynchronously create a repository using celery
Requested reviews:
Launchpad code reviewers (launchpad-reviewers)
For more details, see:
https://code.launchpad.net/~pappacena/turnip/+git/turnip/+merge/387612
--
Your team Launchpad code reviewers is requested to review the proposed merge of ~pappacena/turnip:celery-repo-creation into turnip:master.
diff --git a/Makefile b/Makefile
index d10a9b2..67f60cd 100644
--- a/Makefile
+++ b/Makefile
@@ -8,6 +8,7 @@ PIP_CACHE = $(CURDIR)/pip-cache
PYTHON := $(ENV)/bin/python
PSERVE := $(ENV)/bin/pserve
FLAKE8 := $(ENV)/bin/flake8
+CELERY := $(ENV)/bin/celery
PIP := $(ENV)/bin/pip
VIRTUALENV := virtualenv
@@ -64,7 +65,12 @@ endif
$(PIP) install $(PIP_ARGS) -c requirements.txt \
-e '.[test,deploy]'
-test: $(ENV)
+bootstrap-test:
+ -sudo rabbitmqctl delete_vhost turnip-test-vhost
+ -sudo rabbitmqctl add_vhost turnip-test-vhost
+ -sudo rabbitmqctl set_permissions -p "turnip-test-vhost" "guest" ".*" ".*" ".*"
+
+test: $(ENV) bootstrap-test
$(PYTHON) -m unittest discover $(ARGS) turnip
clean:
@@ -101,6 +107,24 @@ run-api: $(ENV)
run-pack: $(ENV)
$(PYTHON) turnipserver.py
+run-worker: $(ENV)
+ PYTHONPATH="turnip" $(CELERY) -A tasks worker \
+ --loglevel=info \
+ --concurrency=20 \
+ --pool=gevent
+
+run:
+ make run-api &\
+ make run-pack &\
+ make run-worker&\
+ wait;
+
+stop:
+ -pkill -f 'make run-api'
+ -pkill -f 'make run-pack'
+ -pkill -f 'make run-worker'
+ -pkill -f '$(CELERY) -A tasks worker'
+
$(PIP_CACHE): $(ENV)
mkdir -p $(PIP_CACHE)
$(PIP) install $(PIP_ARGS) -d $(PIP_CACHE) \
diff --git a/config.yaml b/config.yaml
index e078c33..99b0e7b 100644
--- a/config.yaml
+++ b/config.yaml
@@ -20,3 +20,4 @@ cgit_secret_path: null
openid_provider_root: https://testopenid.test/
site_name: git.launchpad.test
main_site_root: https://launchpad.test/
+celery_broker: pyamqp://guest@localhost//
diff --git a/requirements.txt b/requirements.txt
index 365f354..29ca5d2 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -4,9 +4,10 @@ attrs==19.3.0
Automat==20.2.0
bcrypt==3.1.7
beautifulsoup4==4.6.3
+celery==4.4.6
cffi==1.14.0
constantly==15.1.0
-contextlib2==0.4.0
+contextlib2==0.6.0
cornice==3.6.1
cryptography==2.8
docutils==0.14
@@ -15,6 +16,7 @@ envdir==0.7
extras==1.0.0
fixtures==3.0.0
flake8==2.4.0
+gevent==20.6.2
gmpy==1.17
gunicorn==19.3.0
hyperlink==19.0.0
@@ -31,6 +33,7 @@ Paste==2.0.2
PasteDeploy==2.1.0
pbr==5.4.4
pep8==1.5.7
+psutil==5.7.0
pyasn1==0.4.8
pycparser==2.17
pycrypto==2.6.1
diff --git a/setup.py b/setup.py
index 6eff51e..0c1f5f0 100755
--- a/setup.py
+++ b/setup.py
@@ -18,9 +18,11 @@ with open(os.path.join(here, 'NEWS')) as f:
README += "\n\n" + f.read()
requires = [
+ 'celery',
'contextlib2',
'cornice',
'enum34; python_version < "3.4"',
+ 'gevent',
'lazr.sshserver>=0.1.7',
'Paste',
'pygit2>=0.27.4,<0.28.0',
diff --git a/system-dependencies.txt b/system-dependencies.txt
index 845d453..fdcb1d8 100644
--- a/system-dependencies.txt
+++ b/system-dependencies.txt
@@ -6,3 +6,4 @@ libgit2-27
libssl-dev
python-dev
virtualenv
+rabbitmq-server
diff --git a/turnip/api/store.py b/turnip/api/store.py
index bf61ff6..d6568c3 100644
--- a/turnip/api/store.py
+++ b/turnip/api/store.py
@@ -27,7 +27,10 @@ from pygit2 import (
Repository,
)
+from turnip.config import config
+from turnip.helpers import TimeoutServerProxy
from turnip.pack.helpers import ensure_config
+from turnip.tasks import app
REF_TYPE_NAME = {
@@ -248,6 +251,27 @@ def init_repo(repo_path, clone_from=None, clone_refs=False,
set_repository_creating(repo_path, False)
+@app.task
+def init_and_confirm_repo(untranslated_path, repo_path, clone_from=None,
+ clone_refs=False, alternate_repo_paths=None,
+ is_bare=True):
+ xmlrpc_endpoint = config.get("virtinfo_endpoint")
+ xmlrpc_timeout = float(config.get("virtinfo_timeout"))
+ xmlrpc_auth_params = {"user": "+launchpad-services"}
+ xmlrpc_proxy = TimeoutServerProxy(
+ xmlrpc_endpoint, timeout=xmlrpc_timeout, allow_none=True)
+ try:
+ init_repo(
+ repo_path, clone_from, clone_refs, alternate_repo_paths, is_bare)
+ xmlrpc_proxy.confirmRepoCreation(untranslated_path, xmlrpc_auth_params)
+ except Exception:
+ try:
+ delete_repo(repo_path)
+ except IOError:
+ pass
+ xmlrpc_proxy.abortRepoCreation(untranslated_path, xmlrpc_auth_params)
+
+
@contextmanager
def open_repo(repo_store, repo_name, force_ephemeral=False):
"""Open an existing git repository. Optionally create an ephemeral
diff --git a/turnip/api/tests/test_api.py b/turnip/api/tests/test_api.py
index bcf13f9..5908143 100644
--- a/turnip/api/tests/test_api.py
+++ b/turnip/api/tests/test_api.py
@@ -6,9 +6,11 @@
from __future__ import print_function
import base64
+from datetime import timedelta, datetime
import os
import subprocess
from textwrap import dedent
+import time
import unittest
import uuid
@@ -22,6 +24,8 @@ from testtools.matchers import (
Equals,
MatchesSetwise,
)
+from twisted.internet import reactor as default_reactor
+from twisted.web import server
from webtest import TestApp
from turnip import api
@@ -31,12 +35,14 @@ from turnip.api.tests.test_helpers import (
open_repo,
RepoFactory,
)
+from turnip.config import config
+from turnip.pack.tests.fake_servers import FakeVirtInfoService
+from turnip.tests.compat import mock
+from turnip.tests.tasks import CeleryWorkerFixture
-class ApiTestCase(TestCase):
-
- def setUp(self):
- super(ApiTestCase, self).setUp()
+class ApiRepoStoreMixin:
+ def setupRepoStore(self):
repo_store = self.useFixture(TempDir()).path
self.useFixture(EnvironmentVariable("REPO_STORE", repo_store))
self.app = TestApp(api.main({}))
@@ -46,6 +52,13 @@ class ApiTestCase(TestCase):
self.commit = {'ref': 'refs/heads/master', 'message': 'test commit.'}
self.tag = {'ref': 'refs/tags/tag0', 'message': 'tag message'}
+
+class ApiTestCase(TestCase, ApiRepoStoreMixin):
+
+ def setUp(self):
+ super(ApiTestCase, self).setUp()
+ self.setupRepoStore()
+
def assertReferencesEqual(self, repo, expected, observed):
self.assertEqual(
repo.references[expected].peel().oid,
@@ -876,5 +889,159 @@ class ApiTestCase(TestCase):
self.assertEqual(404, resp.status_code)
+class AsyncRepoCreationAPI(TestCase, ApiRepoStoreMixin):
+
+ def setUp(self):
+ super(AsyncRepoCreationAPI, self).setUp()
+ self.setupRepoStore()
+ # XML-RPC server
+ self.virtinfo = FakeVirtInfoService(allowNone=True)
+ self.virtinfo_listener = default_reactor.listenTCP(0, server.Site(
+ self.virtinfo))
+ self.virtinfo_port = self.virtinfo_listener.getHost().port
+ self.virtinfo_url = b'http://localhost:%d/' % self.virtinfo_port
+ self.addCleanup(self.virtinfo_listener.stopListening)
+ config.defaults['virtinfo_endpoint'] = self.virtinfo_url
+
+ def _doReactorIteration(self):
+ """Yield to the reactor so it can process virtinfo requests.
+
+ This is a bit hacky, but allow us to simulate the twisted XML-RPC
+ fake server without needing to make this test suite async.
+ Making this test suite async could make it less realistic, since the
+ API beign tested itself is not running over twisted event loop.
+ """
+ reactor_iterations = (
+ len(default_reactor._reads) + len(default_reactor._writes))
+ for i in range(reactor_iterations * 100):
+ default_reactor.iterate()
+
+ def assertRepositoryCreatedAsynchronously(self, repo_path, timeout_secs=5):
+ """Waits up to `timeout_secs` for a repository to be available."""
+ timeout = timedelta(seconds=timeout_secs)
+ start = datetime.now()
+ while datetime.now() <= (start + timeout):
+ self._doReactorIteration()
+ try:
+ resp = self.app.get('/repo/{}'.format(repo_path),
+ expect_errors=True)
+ if resp.status_code == 200 and resp.json['is_available']:
+ return
+ except:
+ pass
+ time.sleep(0.1)
+ self.fail(
+ "Repository %s was not created after %s secs"
+ % (repo_path, timeout_secs))
+
+ def assertAnyMockCalledAsync(self, mocks, timeout_secs=5):
+ """Asserts that any of the mocks in *args will be called in the
+ next timeout_secs seconds.
+ """
+ timeout = timedelta(seconds=timeout_secs)
+ start = datetime.now()
+ while datetime.now() <= (start + timeout):
+ self._doReactorIteration()
+ if any(i.called for i in mocks):
+ return
+ time.sleep(0.1)
+ self.fail(
+ "None of the given args was called after %s seconds."
+ % timeout_secs)
+
+ def test_repo_async_creation_with_clone(self):
+ """Repo can be initialised with optional clone asynchronously."""
+ self.useFixture(CeleryWorkerFixture())
+ self.virtinfo.xmlrpc_confirmRepoCreation = mock.Mock(return_value=None)
+ self.virtinfo.xmlrpc_abortRepoCreation = mock.Mock(return_value=None)
+
+ factory = RepoFactory(self.repo_store, num_commits=2)
+ factory.build()
+ new_repo_path = uuid.uuid1().hex
+ resp = self.app.post_json('/repo', {
+ 'async': True,
+ 'repo_path': new_repo_path,
+ 'clone_from': self.repo_path,
+ 'clone_refs': True})
+
+ self.assertRepositoryCreatedAsynchronously(new_repo_path)
+
+ repo1_revlist = get_revlist(factory.repo)
+ clone_from = resp.json['repo_url'].split('/')[-1]
+ repo2 = open_repo(os.path.join(self.repo_root, clone_from))
+ repo2_revlist = get_revlist(repo2)
+
+ self.assertEqual(repo1_revlist, repo2_revlist)
+ self.assertEqual(200, resp.status_code)
+ self.assertIn(new_repo_path, resp.json['repo_url'])
+
+ self.assertEqual([mock.call(
+ mock.ANY, new_repo_path, {"user": "+launchpad-services"})],
+ self.virtinfo.xmlrpc_confirmRepoCreation.call_args_list)
+ self.assertEqual(
+ [], self.virtinfo.xmlrpc_abortRepoCreation.call_args_list)
+
+ def test_repo_async_creation_aborts_when_fails_to_create_locally(self):
+ """Repo can be initialised with optional clone asynchronously."""
+ self.useFixture(
+ EnvironmentVariable("REPO_STORE", '/tmp/invalid/path/to/repos/'))
+ self.useFixture(CeleryWorkerFixture())
+ self.virtinfo.xmlrpc_confirmRepoCreation = mock.Mock(return_value=None)
+ self.virtinfo.xmlrpc_abortRepoCreation = mock.Mock(return_value=None)
+
+ factory = RepoFactory(self.repo_store, num_commits=2)
+ factory.build()
+ new_repo_path = uuid.uuid1().hex
+ self.app.post_json('/repo', {
+ 'async': True,
+ 'repo_path': new_repo_path,
+ 'clone_from': self.repo_path,
+ 'clone_refs': True})
+
+ # Wait until the repository creation is either confirmed or aborted
+ # (and we hope it was aborted...)
+ self.assertAnyMockCalledAsync([
+ self.virtinfo.xmlrpc_confirmRepoCreation,
+ self.virtinfo.xmlrpc_abortRepoCreation])
+ self.assertFalse(
+ os.path.exists(os.path.join(self.repo_root, new_repo_path)))
+
+ self.assertEqual([mock.call(
+ mock.ANY, new_repo_path, {"user": "+launchpad-services"})],
+ self.virtinfo.xmlrpc_abortRepoCreation.call_args_list)
+ self.assertEqual(
+ [], self.virtinfo.xmlrpc_confirmRepoCreation.call_args_list)
+
+ def test_repo_async_creation_aborts_when_fails_confirm(self):
+ """Repo can be initialised with optional clone asynchronously."""
+ self.useFixture(CeleryWorkerFixture())
+ self.virtinfo.xmlrpc_confirmRepoCreation = mock.Mock(
+ side_effect=Exception("?"))
+ self.virtinfo.xmlrpc_abortRepoCreation = mock.Mock(return_value=None)
+
+ factory = RepoFactory(self.repo_store, num_commits=2)
+ factory.build()
+ new_repo_path = uuid.uuid1().hex
+ self.app.post_json('/repo', {
+ 'async': True,
+ 'repo_path': new_repo_path,
+ 'clone_from': self.repo_path,
+ 'clone_refs': True})
+
+ # Wait until the repository creation is either confirmed or aborted
+ # (and we hope it was aborted...)
+ self.assertAnyMockCalledAsync([
+ self.virtinfo.xmlrpc_abortRepoCreation])
+ self.assertFalse(
+ os.path.exists(os.path.join(self.repo_root, new_repo_path)))
+
+ self.assertEqual([mock.call(
+ mock.ANY, new_repo_path, {"user": "+launchpad-services"})],
+ self.virtinfo.xmlrpc_abortRepoCreation.call_args_list)
+ self.assertEqual([mock.call(
+ mock.ANY, new_repo_path, {"user": "+launchpad-services"})],
+ self.virtinfo.xmlrpc_confirmRepoCreation.call_args_list)
+
+
if __name__ == '__main__':
unittest.main()
diff --git a/turnip/api/views.py b/turnip/api/views.py
index 37e89ef..de6bb4e 100644
--- a/turnip/api/views.py
+++ b/turnip/api/views.py
@@ -57,6 +57,7 @@ class RepoAPI(BaseAPI):
repo_path = json_data.get('repo_path')
clone_path = json_data.get('clone_from')
clone_refs = json_data.get('clone_refs', False)
+ async_run = json_data.get('async', False)
if not repo_path:
self.request.errors.add('body', 'repo_path',
@@ -73,7 +74,13 @@ class RepoAPI(BaseAPI):
repo_clone = None
try:
- store.init_repo(repo, clone_from=repo_clone, clone_refs=clone_refs)
+ kwargs = dict(
+ repo_path=repo, clone_from=repo_clone, clone_refs=clone_refs)
+ if async_run:
+ kwargs["untranslated_path"] = repo_path
+ store.init_and_confirm_repo.apply_async(kwargs=kwargs)
+ else:
+ store.init_repo(**kwargs)
repo_name = os.path.basename(os.path.normpath(repo))
return {'repo_url': '/'.join([self.request.url, repo_name])}
except GitError:
diff --git a/turnip/helpers.py b/turnip/helpers.py
index 77e12ed..b23e4a6 100644
--- a/turnip/helpers.py
+++ b/turnip/helpers.py
@@ -10,6 +10,7 @@ from __future__ import (
import os.path
import six
+from six.moves import xmlrpc_client
def compose_path(root, path):
@@ -22,3 +23,24 @@ def compose_path(root, path):
if not full_path.startswith(os.path.abspath(root)):
raise ValueError('Path not contained within root')
return full_path
+
+
+class TimeoutTransport(xmlrpc_client.Transport):
+
+ def __init__(self, timeout, use_datetime=0):
+ self.timeout = timeout
+ xmlrpc_client.Transport.__init__(self, use_datetime)
+
+ def make_connection(self, host):
+ connection = xmlrpc_client.Transport.make_connection(self, host)
+ connection.timeout = self.timeout
+ return connection
+
+
+class TimeoutServerProxy(xmlrpc_client.ServerProxy):
+
+ def __init__(self, uri, timeout=10, transport=None, encoding=None,
+ verbose=0, allow_none=0, use_datetime=0):
+ t = TimeoutTransport(timeout)
+ xmlrpc_client.ServerProxy.__init__(
+ self, uri, t, encoding, verbose, allow_none, use_datetime)
diff --git a/turnip/tasks.py b/turnip/tasks.py
new file mode 100644
index 0000000..51b5d20
--- /dev/null
+++ b/turnip/tasks.py
@@ -0,0 +1,16 @@
+# Copyright 2020 Canonical Ltd. This software is licensed under the
+# GNU Affero General Public License version 3 (see the file LICENSE).
+
+from __future__ import print_function, unicode_literals, absolute_import
+
+__all__ = [
+ 'app'
+]
+
+from celery import Celery
+
+from turnip.config import config
+
+
+app = Celery('tasks', broker=config.get('celery_broker'))
+app.conf.update(imports=('turnip.api.store', ))
diff --git a/turnip/tests/__init__.py b/turnip/tests/__init__.py
index 494f3fd..6be77e3 100644
--- a/turnip/tests/__init__.py
+++ b/turnip/tests/__init__.py
@@ -8,6 +8,8 @@ from __future__ import (
)
from turnip.tests.logging import setupLogger
+from turnip.tests.tasks import setupCelery
setupLogger()
+setupCelery()
diff --git a/turnip/tests/tasks.py b/turnip/tests/tasks.py
new file mode 100644
index 0000000..401d079
--- /dev/null
+++ b/turnip/tests/tasks.py
@@ -0,0 +1,84 @@
+# Copyright 2020 Canonical Ltd. This software is licensed under the
+# GNU Affero General Public License version 3 (see the file LICENSE).
+
+import atexit
+import os
+import subprocess
+import sys
+
+from testtools.testcase import fixtures
+
+from turnip.config import config
+from turnip.tasks import app
+
+BROKER_URL = 'pyamqp://guest@localhost/turnip-test-vhost'
+
+
+def setupCelery():
+ app.conf.update(broker_url=BROKER_URL)
+
+
+class CeleryWorkerFixture(fixtures.Fixture):
+ """Celery worker fixture for tests
+
+ This fixture starts a celery worker with the configuration set when the
+ fixture is setUp. Keep in mind that this will run in a separated
+ new process, so mock patches for example will be lost.
+ """
+ _worker_proc = None
+
+ def __init__(self, loglevel="error", force_restart=True, env=None):
+ """
+ Build a celery worker for test cases.
+
+ :param loglevel: Which log level to use for the worker.
+ :param force_restart: If True and a celery worker is already running,
+ stop it. If False, do not restart if another worker is
+ already running.
+ :param env: The environment variables to be used when creating
+ the worker.
+ """
+ self.force_restart = force_restart
+ self.loglevel = loglevel
+ self.env = env
+
+ def startCeleryWorker(self):
+ """Start a celery worker for integration tests."""
+ if self.force_restart:
+ self.stopCeleryWorker()
+ if CeleryWorkerFixture._worker_proc is not None:
+ return
+ bin_path = os.path.dirname(sys.executable)
+ celery = os.path.join(bin_path, 'celery')
+ turnip_path = os.path.join(os.path.dirname(__file__), '..')
+ cmd = [
+ celery, 'worker', '-A', 'tasks', '--quiet',
+ '--pool=gevent',
+ '--concurrency=2',
+ '--broker=%s' % BROKER_URL,
+ '--loglevel=%s' % self.loglevel]
+
+ # Send to the subprocess, as env variables, the same configurations we
+ # are currently using.
+ proc_env = {'PYTHONPATH': turnip_path}
+ for k in config.defaults:
+ proc_env[k.upper()] = str(config.get(k))
+ proc_env.update(self.env or {})
+
+ CeleryWorkerFixture._worker_proc = subprocess.Popen(cmd, env=proc_env)
+ atexit.register(self.stopCeleryWorker)
+
+ def stopCeleryWorker(self):
+ worker_proc = CeleryWorkerFixture._worker_proc
+ if worker_proc:
+ worker_proc.kill()
+ worker_proc.wait()
+ CeleryWorkerFixture._worker_proc = None
+ # Cleanup the queue.
+ app.control.purge()
+
+ def _setUp(self):
+ self.startCeleryWorker()
+
+ def _cleanup(self):
+ self.stopCeleryWorker()
Follow ups