fix caching and tests

This commit is contained in:
Neil Johnson 2018-08-03 13:49:53 +01:00
parent 897c51d274
commit 950807d93a
3 changed files with 80 additions and 62 deletions

View file

@ -64,7 +64,6 @@ from synapse.rest.media.v0.content_repository import ContentRepoResource
from synapse.server import HomeServer from synapse.server import HomeServer
from synapse.storage import are_all_users_on_domain from synapse.storage import are_all_users_on_domain
from synapse.storage.engines import IncorrectDatabaseSetup, create_engine from synapse.storage.engines import IncorrectDatabaseSetup, create_engine
from synapse.storage.monthly_active_users import MonthlyActiveUsersStore
from synapse.storage.prepare_database import UpgradeDatabaseException, prepare_database from synapse.storage.prepare_database import UpgradeDatabaseException, prepare_database
from synapse.util.caches import CACHE_SIZE_FACTOR from synapse.util.caches import CACHE_SIZE_FACTOR
from synapse.util.httpresourcetree import create_resource_tree from synapse.util.httpresourcetree import create_resource_tree

View file

@ -1,6 +1,21 @@
# -*- coding: utf-8 -*-
# Copyright 2018 New Vector
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from twisted.internet import defer from twisted.internet import defer
from synapse.util.caches.descriptors import cachedInlineCallbacks
from synapse.storage.engines import PostgresEngine, Sqlite3Engine from synapse.util.caches.descriptors import cached, cachedInlineCallbacks
from ._base import SQLBaseStore from ._base import SQLBaseStore
@ -9,7 +24,7 @@ class MonthlyActiveUsersStore(SQLBaseStore):
def __init__(self, dbconn, hs): def __init__(self, dbconn, hs):
super(MonthlyActiveUsersStore, self).__init__(None, hs) super(MonthlyActiveUsersStore, self).__init__(None, hs)
self._clock = hs.get_clock() self._clock = hs.get_clock()
self.max_mau_value = hs.config.max_mau_value self.hs = hs
def reap_monthly_active_users(self): def reap_monthly_active_users(self):
""" """
@ -19,62 +34,41 @@ class MonthlyActiveUsersStore(SQLBaseStore):
Defered() Defered()
""" """
def _reap_users(txn): def _reap_users(txn):
thirty_days_ago = ( thirty_days_ago = (
int(self._clock.time_msec()) - (1000 * 60 * 60 * 24 * 30) int(self._clock.time_msec()) - (1000 * 60 * 60 * 24 * 30)
) )
if isinstance(self.database_engine, PostgresEngine): sql = "DELETE FROM monthly_active_users WHERE timestamp < ?"
sql = """
DELETE FROM monthly_active_users
WHERE timestamp < ?
RETURNING user_id
"""
txn.execute(sql, (thirty_days_ago,))
res = txn.fetchall()
for r in res:
self.is_user_monthly_active.invalidate(r)
sql = """ txn.execute(sql, (thirty_days_ago,))
DELETE FROM monthly_active_users sql = """
ORDER BY timestamp desc DELETE FROM monthly_active_users
LIMIT -1 OFFSET ? ORDER BY timestamp desc
RETURNING user_id LIMIT -1 OFFSET ?
""" """
txn.execute(sql, (self.max_mau_value,)) txn.execute(sql, (self.hs.config.max_mau_value,))
res = txn.fetchall()
for r in res:
self.is_user_monthly_active.invalidate(r)
print r
self.get_monthly_active_count.invalidate()
elif isinstance(self.database_engine, Sqlite3Engine):
sql = "DELETE FROM monthly_active_users WHERE timestamp < ?"
txn.execute(sql, (thirty_days_ago,)) res = self.runInteraction("reap_monthly_active_users", _reap_users)
sql = """ # It seems poor to invalidate the whole cache, Postgres supports
DELETE FROM monthly_active_users # 'Returning' which would allow me to invalidate only the
ORDER BY timestamp desc # specific users, but sqlite has no way to do this and instead
LIMIT -1 OFFSET ? # I would need to SELECT and the DELETE which without locking
""" # is racy.
txn.execute(sql, (self.max_mau_value,)) # Have resolved to invalidate the whole cache for now and do
# something about it if and when the perf becomes significant
self.is_user_monthly_active.invalidate_all()
self.get_monthly_active_count.invalidate_all()
return res
# It seems poor to invalidate the whole cache, but the alternative @cached(num_args=0)
# is to select then delete which has its own problems.
# It seems unlikely that anyone using this feature on large datasets
# would be using sqlite and if they are then there will be
# larger perf issues than this one to encourage an upgrade to postgres.
self.is_user_monthly_active.invalidate_all()
self.get_monthly_active_count.invalidate_all()
return self.runInteraction("reap_monthly_active_users", _reap_users)
@cachedInlineCallbacks(num_args=0)
def get_monthly_active_count(self): def get_monthly_active_count(self):
""" """
Generates current count of monthly active users.abs Generates current count of monthly active users.abs
Return: Return:
Defered(int): Number of current monthly active users Defered(int): Number of current monthly active users
""" """
def _count_users(txn): def _count_users(txn):
sql = "SELECT COALESCE(count(*), 0) FROM monthly_active_users" sql = "SELECT COALESCE(count(*), 0) FROM monthly_active_users"
@ -91,7 +85,7 @@ class MonthlyActiveUsersStore(SQLBaseStore):
Deferred(bool): True if a new entry was created, False if an Deferred(bool): True if a new entry was created, False if an
existing one was updated. existing one was updated.
""" """
return self._simple_upsert( self._simple_upsert(
desc="upsert_monthly_active_user", desc="upsert_monthly_active_user",
table="monthly_active_users", table="monthly_active_users",
keyvalues={ keyvalues={
@ -102,6 +96,8 @@ class MonthlyActiveUsersStore(SQLBaseStore):
}, },
lock=False, lock=False,
) )
self.is_user_monthly_active.invalidate((user_id,))
self.get_monthly_active_count.invalidate(())
@cachedInlineCallbacks(num_args=1) @cachedInlineCallbacks(num_args=1)
def is_user_monthly_active(self, user_id): def is_user_monthly_active(self, user_id):
@ -120,5 +116,4 @@ class MonthlyActiveUsersStore(SQLBaseStore):
retcol="user_id", retcol="user_id",
desc="is_user_monthly_active", desc="is_user_monthly_active",
) )
defer.returnValue(bool(user_present)) defer.returnValue(bool(user_present))

View file

@ -1,6 +1,19 @@
from twisted.internet import defer # -*- coding: utf-8 -*-
# Copyright 2018 New Vector
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from synapse.storage.monthly_active_users import MonthlyActiveUsersStore from twisted.internet import defer
import tests.unittest import tests.unittest
import tests.utils import tests.utils
@ -10,20 +23,19 @@ from tests.utils import setup_test_homeserver
class MonthlyActiveUsersTestCase(tests.unittest.TestCase): class MonthlyActiveUsersTestCase(tests.unittest.TestCase):
def __init__(self, *args, **kwargs): def __init__(self, *args, **kwargs):
super(MonthlyActiveUsersTestCase, self).__init__(*args, **kwargs) super(MonthlyActiveUsersTestCase, self).__init__(*args, **kwargs)
self.mau = None
@defer.inlineCallbacks @defer.inlineCallbacks
def setUp(self): def setUp(self):
hs = yield setup_test_homeserver() self.hs = yield setup_test_homeserver()
self.mau = MonthlyActiveUsersStore(None, hs) self.store = self.hs.get_datastore()
@defer.inlineCallbacks @defer.inlineCallbacks
def test_can_insert_and_count_mau(self): def test_can_insert_and_count_mau(self):
count = yield self.mau.get_monthly_active_count() count = yield self.store.get_monthly_active_count()
self.assertEqual(0, count) self.assertEqual(0, count)
yield self.mau.upsert_monthly_active_user("@user:server") yield self.store.upsert_monthly_active_user("@user:server")
count = yield self.mau.get_monthly_active_count() count = yield self.store.get_monthly_active_count()
self.assertEqual(1, count) self.assertEqual(1, count)
@ -32,11 +44,23 @@ class MonthlyActiveUsersTestCase(tests.unittest.TestCase):
user_id1 = "@user1:server" user_id1 = "@user1:server"
user_id2 = "@user2:server" user_id2 = "@user2:server"
user_id3 = "@user3:server" user_id3 = "@user3:server"
result = yield self.mau.is_user_monthly_active(user_id1) result = yield self.store.is_user_monthly_active(user_id1)
self.assertFalse(result) self.assertFalse(result)
yield self.mau.upsert_monthly_active_user(user_id1) yield self.store.upsert_monthly_active_user(user_id1)
yield self.mau.upsert_monthly_active_user(user_id2) yield self.store.upsert_monthly_active_user(user_id2)
result = yield self.mau.is_user_monthly_active(user_id1) result = yield self.store.is_user_monthly_active(user_id1)
self.assertTrue(result) self.assertTrue(result)
result = yield self.mau.is_user_monthly_active(user_id3) result = yield self.store.is_user_monthly_active(user_id3)
self.assertFalse(result) self.assertFalse(result)
@defer.inlineCallbacks
def test_reap_monthly_active_users(self):
self.hs.config.max_mau_value = 5
initial_users = 10
for i in range(initial_users):
yield self.store.upsert_monthly_active_user("@user%d:server" % i)
count = yield self.store.get_monthly_active_count()
self.assertTrue(count, initial_users)
yield self.store.reap_monthly_active_users()
count = yield self.store.get_monthly_active_count()
self.assertTrue(count, initial_users - self.hs.config.max_mau_value)