1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172
|
# Copyright DataStax, Inc.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import logging
import time
from collections import defaultdict
from packaging.version import Version
from tests.integration import (get_node, get_cluster, wait_for_node_socket,
DSE_VERSION, CASSANDRA_VERSION)
IP_FORMAT = '127.0.0.%s'
log = logging.getLogger(__name__)
class CoordinatorStats():
    """Per-host tally of which coordinator answered each query.

    Counts are kept in ``coordinator_counts``, a ``defaultdict(int)`` keyed
    by host address, so looking up an address that has not been seen yet
    yields 0 (and creates the entry).
    """

    def __init__(self):
        self.coordinator_counts = defaultdict(int)

    def add_coordinator(self, future):
        """Wait for *future* and credit one query to the host that served it.

        ``future.result()`` is called before anything is counted, so an
        exception raised by it propagates and no count is recorded.  Any
        entries in ``future._errors`` are logged at error level.
        """
        log.debug('adding coordinator from {}'.format(future))
        future.result()

        address = future._current_host.address
        self.coordinator_counts[address] += 1

        errors = future._errors
        if errors:
            log.error('future._errors: %s', errors)

    def reset_counts(self):
        """Discard every recorded count by installing a fresh mapping."""
        self.coordinator_counts = defaultdict(int)

    def get_query_count(self, node):
        """Return the number of queries recorded for ``127.0.0.<node>``."""
        return self.coordinator_counts['127.0.0.%d' % node]

    def assert_query_count_equals(self, testcase, node, expected):
        """Call ``testcase.fail`` unless *node* has exactly *expected* queries.

        The failure message includes the full count mapping.
        """
        actual = self.get_query_count(node)
        if actual == expected:
            return

        ip = '127.0.0.%d' % node
        testcase.fail('Expected %d queries to %s, but got %d. Query counts: %s' % (
            expected, ip, actual, dict(self.coordinator_counts)))
def create_schema(cluster, session, keyspace, simple_strategy=True,
                  replication_factor=1, replication_strategy=None):
    """Recreate *keyspace* with a single table ``cf`` and switch to it.

    If the keyspace is already listed in ``cluster.metadata.keyspaces`` it
    is dropped first.  With ``simple_strategy`` the keyspace uses
    SimpleStrategy and *replication_factor*; otherwise it uses
    NetworkTopologyStrategy with the options taken from the text of
    *replication_strategy* (its ``str()`` minus the first and last
    character).

    Raises:
        Exception: if ``simple_strategy`` is false and no
            *replication_strategy* was supplied.  The drop, if any, has
            already been executed by then.
    """
    if keyspace in cluster.metadata.keyspaces:
        session.execute('DROP KEYSPACE %s' % keyspace, timeout=20)

    if simple_strategy:
        create_keyspace = (
            "CREATE KEYSPACE %s WITH replication"
            " = {'class': 'SimpleStrategy', 'replication_factor': '%s'}"
        ) % (keyspace, replication_factor)
    else:
        if not replication_strategy:
            raise Exception('replication_strategy is not set')
        # Strip the surrounding braces from the repr so the entries can be
        # spliced into the CQL map literal.
        strategy_options = str(replication_strategy)[1:-1]
        create_keyspace = (
            "CREATE KEYSPACE %s"
            " WITH replication = { 'class' : 'NetworkTopologyStrategy', %s }"
        ) % (keyspace, strategy_options)
    session.execute(create_keyspace, timeout=10)

    create_table = 'CREATE TABLE %s.cf (k int PRIMARY KEY, i int)' % keyspace
    session.execute(create_table, timeout=10)
    session.execute('USE %s' % keyspace)
def start(node):
    """Start the cluster node looked up via ``get_node(node)``."""
    target = get_node(node)
    target.start()
def stop(node):
    """Stop the cluster node looked up via ``get_node(node)``."""
    target = get_node(node)
    target.stop()
def force_stop(node):
    """Stop a node with ``wait=False, gently=False``, logging before and after."""
    log.debug("Forcing stop of node %s", node)
    stop_options = dict(wait=False, gently=False)
    get_node(node).stop(**stop_options)
    log.debug("Node %s was stopped", node)
def decommission(node):
    """Decommission a node and then stop it.

    ``force=True`` is passed to the node's ``decommission`` when running
    DSE 5.1 or later, or Cassandra 4.0-a or later (see CASSANDRA-12510);
    otherwise it is called with no arguments.
    """
    needs_force = (
        (DSE_VERSION and DSE_VERSION >= Version("5.1"))
        or CASSANDRA_VERSION >= Version("4.0-a")
    )
    # CASSANDRA-12510
    decommission_options = {'force': True} if needs_force else {}

    get_node(node).decommission(**decommission_options)
    get_node(node).stop()
def bootstrap(node, data_center=None, token=None):
    """Add a new node to the current test cluster and start it.

    The node object is created with the same class as an existing cluster
    node, is added as a non-seed member, and is started.  If the first
    start raises, exactly one more attempt is made.

    Args:
        node: integer node number; used for the node name, the last octet
            of its interfaces (via ``IP_FORMAT``), the JMX port
            (``7000 + 100 * node``) and the default initial token.
        data_center: passed through to ``cluster.add``.
        token: initial token for the node.  Any falsy value (including 0)
            falls back to ``node * 10``.

    Raises:
        Exception: whatever the second ``start()`` attempt raised.
    """
    # Log the actual argument values; the previous template was never
    # formatted, so the literal "{node}" placeholders were logged instead.
    log.debug('called bootstrap(node=%s, data_center=%s, token=%s)',
              node, data_center, token)

    cluster = get_cluster()
    # for now assumes cluster has at least one node
    node_type = type(next(iter(cluster.nodes.values())))
    node_instance = node_type(
        'node%s' % node,
        cluster,
        auto_bootstrap=False,
        thrift_interface=(IP_FORMAT % node, 9160),
        storage_interface=(IP_FORMAT % node, 7000),
        binary_interface=(IP_FORMAT % node, 9042),
        jmx_port=str(7000 + 100 * node),
        remote_debug_port=0,
        initial_token=token if token else node * 10
    )
    cluster.add(node_instance, is_seed=False, data_center=data_center)

    try:
        node_instance.start()
    except Exception as e0:
        log.debug('failed 1st bootstrap attempt with: \n%s', e0)
    else:
        return

    # Try only twice
    try:
        node_instance.start()
    except Exception as e1:
        log.debug('failed 2nd bootstrap attempt with: \n%s', e1)
        log.error('Added node failed to start twice.')
        # Bare raise keeps the original traceback intact.
        raise
def ring(node):
    """Run ``nodetool ring`` on the given node; the result is discarded."""
    target = get_node(node)
    target.nodetool('ring')
def wait_for_up(cluster, node):
    """Block until the driver's metadata reports *node* as up.

    Polls ``cluster.metadata.get_host`` up to 100 times, sleeping one second
    after each unsuccessful check.  Once the host is marked up,
    ``wait_for_node_socket`` is called for the node (with 60 as its second
    argument) before returning.

    Raises:
        RuntimeError: if the host is still not up after 100 checks.
    """
    max_attempts = 100
    addr = IP_FORMAT % node

    for _ in range(max_attempts):
        host = cluster.metadata.get_host(addr)
        if host and host.is_up:
            wait_for_node_socket(get_node(node), 60)
            log.debug("Done waiting for node %s to be up", node)
            return

        log.debug("Host {} is still marked down, waiting".format(addr))
        time.sleep(1)

    # TODO: don't mix string interpolation methods in the same package
    raise RuntimeError("Host {0} is not up after {1} attempts".format(addr, max_attempts))
def wait_for_down(cluster, node):
    """Block until the driver's metadata no longer reports *node* as up.

    Polls ``cluster.metadata.get_host`` up to 100 times, sleeping one second
    after each check that still finds the host up.  A host that is missing
    from the metadata counts as down.

    Raises:
        RuntimeError: if the host is still marked up after 100 checks.
    """
    log.debug("Waiting for node %s to be down", node)
    tries = 0
    # Resolve the address once and reuse it for every lookup and message.
    addr = IP_FORMAT % node
    while tries < 100:
        host = cluster.metadata.get_host(addr)
        if not host or not host.is_up:
            log.debug("Done waiting for node %s to be down", node)
            return

        # Name the host in the message, as wait_for_up does.
        log.debug("Host %s is still marked up, waiting", addr)
        tries += 1
        time.sleep(1)

    raise RuntimeError("Host {0} is not down after {1} attempts".format(addr, tries))
|