1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
|
##############################################################################
# Copyright (c) 2017 ZTE Corporation and others.
#
# All rights reserved. This program and the accompanying materials
# are made available under the terms of the Apache License, Version 2.0
# which accompanies this distribution, and is available at
# http://www.apache.org/licenses/LICENSE-2.0
##############################################################################
import collections
from flask import Flask
from flask import request
import json
import time
from threading import Thread
import requests
from identity_auth import get_identity_auth
from identity_auth import get_session
from os_clients import nova_client
from os_clients import neutron_client
from inspector.base import BaseInspector
import utils
class SampleInspector(BaseInspector):
    """Sample inspector reacting to ``compute.host.down`` events.

    For every matching event the inspector forces the ``nova-compute``
    service of the host down, resets the state of the servers known to run
    on that host and updates the data plane status of the ports bound to it.
    Events are received through the HTTP API served by ``InspectorApp``.
    """

    # Only events carrying this type are acted upon by handle_events().
    event_type = 'compute.host.down'

    def __init__(self, conf, log):
        """Create the nova/neutron clients and the empty bookkeeping state.

        :param conf: configuration object; this class reads
            ``doctor_project``, ``instance_count``, ``nova_version``,
            ``inspector.ip`` and ``inspector.port`` from it.
        :param log: logger used for all messages of the inspector.
        """
        # NOTE(review): BaseInspector.__init__ is presumed to store
        # ``conf``/``log`` as ``self.conf``/``self.log`` - confirm.
        super(SampleInspector, self).__init__(conf, log)
        self.inspector_url = self.get_inspector_url()
        self.novaclients = list()
        self._init_novaclients()
        # Normally we use this client for non redundant API calls
        self.nova = self.novaclients[0]

        auth = get_identity_auth(project=self.conf.doctor_project)
        session = get_session(auth=auth)
        self.neutron = neutron_client(session)

        # Maps a compute hostname to the list of servers found on it.
        self.servers = collections.defaultdict(list)
        # Hosts that were forced down and must be restored by stop().
        self.hostnames = list()
        # InspectorApp thread; stays None until start() is called.
        self.app = None

    def _init_novaclients(self):
        """Fill ``self.novaclients`` with ``conf.instance_count`` clients."""
        self.NUMBER_OF_CLIENTS = self.conf.instance_count
        auth = get_identity_auth(project=self.conf.doctor_project)
        session = get_session(auth=auth)
        for _ in range(self.NUMBER_OF_CLIENTS):
            self.novaclients.append(
                nova_client(self.conf.nova_version, session))

    def _init_servers_list(self):
        """Rebuild the hostname -> servers map from nova (all tenants)."""
        self.servers.clear()
        opts = {'all_tenants': True}
        for server in self.nova.servers.list(search_opts=opts):
            # Read the raw attribute dict; a missing key yields None
            # instead of raising, so the failure must be checked explicitly.
            try:
                host = server.__dict__.get('OS-EXT-SRV-ATTR:host')
            except AttributeError:
                host = None
            if host is None:
                self.log.info('can not get hostname from server=%s' % server)
                continue
            self.servers[host].append(server)
            self.log.debug('get hostname=%s from server=%s' % (host, server))

    def get_inspector_url(self):
        """Return the base URL built from ``conf.inspector.ip`` and port."""
        return 'http://%s:%s' % (self.conf.inspector.ip,
                                 self.conf.inspector.port)

    def start(self):
        """Load the server list and start the HTTP application thread."""
        self.log.info('sample inspector start......')
        self._init_servers_list()
        self.app = InspectorApp(self.conf.inspector.port, self, self.log)
        self.app.start()

    def stop(self):
        """Undo the forced-down state and ask the HTTP app to shut down.

        Does nothing besides logging when start() was never called.
        """
        self.log.info('sample inspector stop......')
        if not self.app:
            return
        for hostname in self.hostnames:
            self.nova.services.force_down(hostname, 'nova-compute', False)

        headers = {
            'Content-Type': 'application/json',
            'Accept': 'application/json',
        }
        # Join base URL and path with exactly one slash between them.
        url = '%s/shutdown' % self.inspector_url.rstrip('/')
        requests.post(url, data='', headers=headers)

    def handle_events(self, events):
        """Process a list of event dicts, acting on host-down events.

        Events whose ``type`` differs from ``event_type`` are skipped
        before any other key is read, so unrelated events do not need a
        ``details``/``hostname`` entry.

        :param events: iterable of dicts with a ``type`` key; matching
            events must also provide ``details.hostname``.
        """
        for event in events:
            if event['type'] != self.event_type:
                continue
            hostname = event['details']['hostname']
            # Record each host once so stop() restores it a single time.
            if hostname not in self.hostnames:
                self.hostnames.append(hostname)
            # The three actions are started together and then awaited.
            thr1 = self._disable_compute_host(hostname)
            thr2 = self._vms_reset_state('error', hostname)
            thr3 = self._set_ports_data_plane_status('DOWN', hostname)
            thr1.join()
            thr2.join()
            thr3.join()

    # NOTE(review): utils.run_async is presumed to run the function in a
    # thread and return that thread (callers invoke .join()) - confirm.
    @utils.run_async
    def _disable_compute_host(self, hostname):
        """Force the nova-compute service of ``hostname`` down."""
        self.nova.services.force_down(hostname, 'nova-compute', True)
        self.log.info('doctor mark host(%s) down at %s'
                      % (hostname, time.time()))

    @utils.run_async
    def _vms_reset_state(self, state, hostname):
        """Reset every server known on ``hostname`` to ``state``.

        Servers are handled in batches no larger than the number of nova
        clients: within a batch each server gets its own client, and the
        batch is awaited before the next one starts. This keeps one client
        per concurrent call while still covering hosts that run more
        servers than there are clients.
        """

        @utils.run_async
        def _vm_reset_state(nova, server, state):
            nova.servers.reset_state(server, state)
            self.log.info('doctor mark vm(%s) error at %s'
                          % (server, time.time()))

        # .get() avoids creating an empty entry for unknown hosts.
        servers = list(self.servers.get(hostname, ()))
        batch_size = len(self.novaclients)
        for first in range(0, len(servers), batch_size):
            batch = servers[first:first + batch_size]
            thrs = []
            for nova, server in zip(self.novaclients, batch):
                thrs.append(_vm_reset_state(nova, server, state))
            for t in thrs:
                t.join()

    @utils.run_async
    def _set_ports_data_plane_status(self, status, hostname):
        """Set ``data_plane_status`` on all ports bound to ``hostname``."""
        # The Networking API expects port attributes wrapped in 'port'.
        # NOTE(review): assumes self.neutron is the standard
        # python-neutronclient v2.0 client - confirm against os_clients.
        body = {'port': {'data_plane_status': status}}

        @utils.run_async
        def _set_port_data_plane_status(port_id):
            self.neutron.update_port(port_id, body)
            self.log.info('doctor set data plane status %s on port %s'
                          % (status, port_id))

        params = {'binding:host_id': hostname}
        listing = self.neutron.list_ports(**params)
        # list_ports() of python-neutronclient returns {'ports': [...]};
        # iterating that dict directly would only yield the key 'ports'.
        if isinstance(listing, dict):
            ports = listing.get('ports', [])
        else:
            ports = listing

        thrs = []
        for port in ports:
            port_id = port['id'] if isinstance(port, dict) else port
            thrs.append(_set_port_data_plane_status(port_id))
        for t in thrs:
            t.join()
class InspectorApp(Thread):
    """Thread running the Flask application of the sample inspector.

    The application exposes ``PUT /events``, which forwards the decoded
    JSON payload to ``inspector.handle_events``, and ``POST /shutdown``,
    which stops the serving Werkzeug server.
    """

    def __init__(self, port, inspector, log):
        """Store the listening port, the inspector and the logger."""
        super(InspectorApp, self).__init__()
        self.port = port
        self.inspector = inspector
        self.log = log

    def run(self):
        """Create the Flask app, register both routes and serve requests."""
        app = Flask('inspector')

        def event_posted():
            # Log arrival time, target inspector and raw payload before
            # handing the parsed events over to the inspector.
            self.log.info('event posted in sample inspector at %s'
                          % time.time())
            self.log.info('sample inspector = %s' % self.inspector)
            self.log.info('sample inspector received data = %s'
                          % request.data)
            payload = request.data.decode('utf8')
            self.inspector.handle_events(json.loads(payload))
            return "OK"

        def shutdown():
            self.log.info('shutdown inspector app server at %s'
                          % time.time())
            # The hook is only present in the WSGI environ when the app is
            # served by the Werkzeug development server.
            stop_server = request.environ.get('werkzeug.server.shutdown')
            if stop_server is None:
                raise RuntimeError('Not running with the Werkzeug Server')
            stop_server()
            return 'inspector app shutting down...'

        # Endpoint names default to the function names, as with @app.route.
        app.add_url_rule('/events', view_func=event_posted, methods=['PUT'])
        app.add_url_rule('/shutdown', view_func=shutdown, methods=['POST'])

        app.run(host="0.0.0.0", port=self.port)
|