1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
|
##############################################################################
# Copyright (c) 2017 ZTE Corporation and others.
#
# All rights reserved. This program and the accompanying materials
# are made available under the terms of the Apache License, Version 2.0
# which accompanies this distribution, and is available at
# http://www.apache.org/licenses/LICENSE-2.0
##############################################################################
import collections
from flask import Flask
from flask import request
import json
import time
from threading import Thread
import requests
from identity_auth import get_identity_auth
from identity_auth import get_session
from os_clients import nova_client
from inspector.base import BaseInspector
class SampleInspector(BaseInspector):
    """Sample inspector reacting to 'compute.host.down' events.

    For every matching event the servers recorded for the affected host
    are reset to the "error" state (one thread and one nova client per
    server) and the host's nova-compute service is forced down.  Events
    arrive through an ``InspectorApp`` HTTP server started by ``start()``.
    """

    # Only events whose 'type' equals this value are acted upon.
    event_type = 'compute.host.down'

    def __init__(self, conf, log):
        """Build the nova clients and the empty host/server bookkeeping.

        :param conf: configuration object; this class reads
            ``instance_count``, ``doctor_project``, ``nova_version``,
            ``inspector.ip`` and ``inspector.port`` from it.
        :param log: logger used for all messages of this inspector.
        """
        # NOTE(review): presumably BaseInspector.__init__ stores these as
        # self.conf / self.log, which the methods below rely on - confirm.
        super(SampleInspector, self).__init__(conf, log)
        self.inspector_url = self.get_inspector_url()
        self.novaclients = list()
        self._init_novaclients()
        # Normally we use this client for non redundant API calls
        self.nova = self.novaclients[0]
        # Maps a hostname to the list of servers found on that host.
        self.servers = collections.defaultdict(list)
        # Hosts that were forced down and must be restored in stop().
        self.hostnames = list()
        self.app = None

    def _init_novaclients(self):
        """Create ``conf.instance_count`` nova clients sharing one session."""
        self.NUMBER_OF_CLIENTS = self.conf.instance_count
        auth = get_identity_auth(project=self.conf.doctor_project)
        session = get_session(auth=auth)
        for _ in range(self.NUMBER_OF_CLIENTS):
            self.novaclients.append(
                nova_client(self.conf.nova_version, session))

    def _init_servers_list(self):
        """Rebuild ``self.servers`` from the servers of all tenants."""
        self.servers.clear()
        opts = {'all_tenants': True}
        servers = self.nova.servers.list(search_opts=opts)
        for server in servers:
            try:
                host = server.__dict__.get('OS-EXT-SRV-ATTR:host')
                self.servers[host].append(server)
                self.log.debug('get hostname=%s from server=%s'
                               % (host, server))
            except Exception:
                # Best effort: a server that cannot be mapped to a host is
                # reported and skipped instead of aborting the whole scan.
                self.log.info('can not get hostname from server=%s' % server)

    def get_inspector_url(self):
        """Return the inspector base URL built from the configured ip/port."""
        return 'http://%s:%s' % (self.conf.inspector.ip,
                                 self.conf.inspector.port)

    def start(self):
        """Load the server list and start the HTTP app thread."""
        self.log.info('sample inspector start......')
        self._init_servers_list()
        self.app = InspectorApp(self.conf.inspector.port, self, self.log)
        self.app.start()

    def stop(self):
        """Undo the forced-down state of handled hosts and stop the app.

        Does nothing beyond logging when ``start()`` was never called.
        """
        self.log.info('sample inspector stop......')
        if not self.app:
            return
        for hostname in self.hostnames:
            self.nova.services.force_down(hostname, 'nova-compute', False)

        headers = {
            'Content-Type': 'application/json',
            'Accept': 'application/json',
        }
        # Avoid a doubled slash when the base URL already ends with one.
        if self.inspector_url.endswith('/'):
            url = '%s%s' % (self.inspector_url, 'shutdown')
        else:
            url = '%s%s' % (self.inspector_url, '/shutdown')
        requests.post(url, data='', headers=headers)

    def handle_events(self, events):
        """Disable the host of every event matching ``event_type``.

        :param events: iterable of dicts providing ``['type']`` and
            ``['details']['hostname']``.
        """
        for event in events:
            hostname = event['details']['hostname']
            event_type = event['type']
            if event_type == self.event_type:
                self.hostnames.append(hostname)
                self.disable_compute_host(hostname)

    def disable_compute_host(self, hostname):
        """Reset the host's servers to "error" and force the host down.

        One ``ThreadedResetState`` thread is started per (client, server)
        pair; all threads are joined before nova-compute is forced down.

        :param hostname: name of the compute host reported as down.
        """
        servers = self.servers[hostname]
        if len(servers) > self.NUMBER_OF_CLIENTS:
            # TODO(tojuvone): This could be enhanced in future with dynamic
            # reuse of self.novaclients when all threads in use
            # The count (not the list itself) must be passed to '%d';
            # formatting the list raised TypeError and aborted this method.
            self.log.error('%d servers in %s. Can handle only %d' % (
                len(servers), hostname, self.NUMBER_OF_CLIENTS))
        threads = []
        # zip() pairs each server with its own client, so servers beyond
        # the number of clients are not processed (reported above).
        for nova, server in zip(self.novaclients, servers):
            t = ThreadedResetState(nova, "error", server, self.log)
            t.start()
            threads.append(t)
        for t in threads:
            t.join()
        self.nova.services.force_down(hostname, 'nova-compute', True)
        self.log.info('doctor mark host(%s) down at %s'
                      % (hostname, time.time()))
class ThreadedResetState(Thread):
    """Thread that resets the state of a single server through nova."""

    def __init__(self, nova, state, server, log):
        """Remember the client, target state, server and logger.

        :param nova: client object exposing ``servers.reset_state``.
        :param state: state passed to ``reset_state`` for the server.
        :param server: server whose state is reset.
        :param log: logger receiving the completion message.
        """
        super(ThreadedResetState, self).__init__()
        self.log = log
        self.server = server
        self.state = state
        self.nova = nova

    def run(self):
        """Reset the server state, then log when it was done."""
        self.nova.servers.reset_state(self.server, self.state)
        # The timestamp is taken after the reset call has returned.
        message = 'doctor mark vm(%s) error at %s' % (self.server,
                                                      time.time())
        self.log.info(message)
class InspectorApp(Thread):
    """Thread running the Flask application that feeds the inspector.

    Routes registered in ``run()``:

    * ``PUT /events`` - JSON-decodes the request body and hands the result
      to ``inspector.handle_events``.
    * ``POST /shutdown`` - calls the ``werkzeug.server.shutdown`` hook
      found in the WSGI environ.
    """

    def __init__(self, port, inspector, log):
        """Store the listening port, the inspector and the logger.

        :param port: port passed to ``Flask.run``.
        :param inspector: object whose ``handle_events`` receives events.
        :param log: logger used by the request handlers.
        """
        super(InspectorApp, self).__init__()
        self.log = log
        self.inspector = inspector
        self.port = port

    def run(self):
        """Create the Flask app, register both routes and serve requests."""
        app = Flask('inspector')

        @app.route('/events', methods=['PUT'])
        def event_posted():
            # Log arrival time, the target inspector and the raw payload
            # before the payload is decoded and dispatched.
            self.log.info(
                'event posted in sample inspector at %s' % time.time())
            self.log.info('sample inspector = %s' % self.inspector)
            self.log.info(
                'sample inspector received data = %s' % request.data)
            decoded_events = json.loads(request.data)
            self.inspector.handle_events(decoded_events)
            return "OK"

        @app.route('/shutdown', methods=['POST'])
        def shutdown():
            self.log.info(
                'shutdown inspector app server at %s' % time.time())
            stop_server = request.environ.get('werkzeug.server.shutdown')
            if stop_server is not None:
                stop_server()
                return 'inspector app shutting down...'
            # No hook in the environ: the app is served by something else.
            raise RuntimeError('Not running with the Werkzeug Server')

        app.run(host="0.0.0.0", port=self.port)
|