pvc/pvcd.py

133 lines
4.3 KiB
Python
Raw Normal View History

2018-05-31 20:26:44 -04:00
#!/usr/bin/env python3
# pvcd.py - PVC hypervisor node daemon
# Part of the Parallel Virtual Cluster (PVC) system
#
# Copyright (C) 2018 Joshua M. Boniface <joshua@boniface.me>
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <https://www.gnu.org/licenses/>.
#
###############################################################################
import kazoo.client
2018-05-31 20:26:44 -04:00
import libvirt
import sys
2018-05-31 21:49:23 -04:00
import socket
2018-05-31 20:26:44 -04:00
import uuid
import VMInstance
2018-05-31 21:49:23 -04:00
import NodeInstance
2018-05-31 20:26:44 -04:00
import time
2018-05-31 21:49:23 -04:00
import atexit
import apscheduler.schedulers.background
2018-06-06 22:59:31 -04:00
import ansiiprint
2018-05-31 20:26:44 -04:00
def help():
    """Print the daemon's name banner in bold text."""
    # NOTE: this name shadows the builtin help(); it is kept as-is for callers.
    banner = "pvcd - Parallel Virtual Cluster management daemon"
    print(ansiiprint.bold() + banner + ansiiprint.end())
2018-05-31 20:26:44 -04:00
# exit(0)
# Print the startup banner
help()

# Connect to the local Zookeeper instance
zk = kazoo.client.KazooClient(hosts='127.0.0.1:2181')
try:
    zk.start()
except Exception:
    # Catch Exception rather than using a bare except, so that Ctrl-C or a
    # SystemExit during startup is not misreported as a connection failure.
    print(ansiiprint.red() + "Failed to connect to local Zookeeper instance" + ansiiprint.end())
    # sys.exit is always available; the bare exit() builtin is injected by
    # the site module and is not guaranteed to exist.
    sys.exit(1)
def zk_listener(state):
    """React to a Zookeeper connection state change.

    A LOST or SUSPENDED state runs cleanup() and then exits with status 2;
    any other state is ignored.
    """
    # NOTE(review): kazoo appears to invoke listeners off the main thread, so
    # exit() here may not terminate the whole process - confirm.
    fatal_states = (
        kazoo.client.KazooState.LOST,
        kazoo.client.KazooState.SUSPENDED,
    )
    if state not in fatal_states:
        return
    cleanup()
    exit(2)


zk.add_listener(zk_listener)
2018-05-31 22:31:20 -04:00
# This node is identified by its hostname; its Zookeeper path is derived from it
myhostname = socket.gethostname()
mynodestring = '/nodes/{}'.format(myhostname)
2018-05-31 22:31:20 -04:00
2018-05-31 21:49:23 -04:00
def cleanup():
    """Best-effort shutdown of the update timer and the Zookeeper session.

    Steps, each attempted independently so that a failure in one does not
    skip the others:
      1. shut down the periodic update scheduler;
      2. unless this node's state is 'flush', write 'stop' to
         /nodes/<hostname>/state;
      3. stop and close the Zookeeper client.

    This runs at interpreter exit (registered with atexit below) and is also
    called by the Zookeeper state listener, so it may run more than once or
    before every global it touches has been created. Errors are therefore
    swallowed on purpose, but only Exception subclasses.
    """
    # The scheduler may not exist yet (NameError) or may already be stopped.
    try:
        update_timer.shutdown()
    except Exception:
        pass

    # A node whose state is 'flush' keeps that state; otherwise mark it stopped.
    try:
        if t_node[myhostname].getstate() != 'flush':
            zk.set('/nodes/{}/state'.format(myhostname), 'stop'.encode('ascii'))
    except Exception:
        pass

    # Always try to release the Zookeeper connection, whatever happened above.
    try:
        zk.stop()
        zk.close()
    except Exception:
        pass


atexit.register(cleanup)
2018-05-31 20:26:44 -04:00
2018-05-31 22:55:44 -04:00
# Check if our node exists in Zookeeper, and create it if not
if zk.exists('/nodes/{}'.format(myhostname)):
    print("Node is " + ansiiprint.green() + "present" + ansiiprint.end() + " in Zookeeper")
else:
    print("Node is " + ansiiprint.red() + "absent" + ansiiprint.end() + " in Zookeeper; adding new node")
    keepalive_time = int(time.time())
    # The keys must live under /nodes/<hostname>: that is the path checked
    # above and the path whose state key is written at shutdown. Creating
    # them under /domains would leave the node absent from /nodes and would
    # register the hostname as a domain.
    node_path = '/nodes/{}'.format(myhostname)
    # makepath=True also creates the /nodes parent on a brand-new cluster.
    zk.create(node_path, 'hypervisor'.encode('ascii'), makepath=True)
    initial_keys = (
        ('state', 'stop'),
        ('cpucount', '0'),
        ('memfree', '0'),
        ('cpuload', '0.0'),
        ('runningdomains', ''),
        ('keepalive', str(keepalive_time)),
    )
    for key, value in initial_keys:
        zk.create('{}/{}'.format(node_path, key), value.encode('ascii'))
2018-05-31 22:55:44 -04:00
2018-05-31 23:28:26 -04:00
# Shared daemon state, filled in by the Zookeeper watchers
t_node = {}            # node name -> NodeInstance object
s_domain = {}          # domain name -> VMInstance object
node_list = list()     # latest children of /nodes
domain_list = list()   # latest children of /domains
2018-05-31 22:55:44 -04:00
2018-05-31 23:28:26 -04:00
@zk.ChildrenWatch('/nodes')
def updatenodes(new_node_list):
    """Watch callback for the children of /nodes.

    Stores the new child list in the global node_list, prints it, then
    creates a NodeInstance for every node not yet in t_node and passes the
    t_node mapping to updatenodelist() on those that already are.
    """
    global node_list
    node_list = new_node_list

    header = ansiiprint.blue() + 'Node list: ' + ansiiprint.end()
    print(header + '{}'.format(' '.join(node_list)))

    for name in node_list:
        if name not in t_node:
            # First time this node is seen: build its instance object
            t_node[name] = NodeInstance.NodeInstance(name, t_node, s_domain, zk)
            continue
        # Known node: hand it the current node mapping
        t_node[name].updatenodelist(t_node)
2018-05-31 20:26:44 -04:00
2018-06-01 01:32:19 -04:00
@zk.ChildrenWatch('/domains')
def updatedomains(new_domain_list):
    """Watch callback for the children of /domains.

    Stores the new child list in the global domain_list, prints it, creates
    a VMInstance (bound to this host's node object) for every domain not yet
    in s_domain, and then passes the s_domain mapping to updatedomainlist()
    on every known node.

    Raises KeyError if this host has no entry in t_node when a new domain
    has to be created.
    """
    global domain_list
    domain_list = new_domain_list
    print(ansiiprint.blue() + 'Domain list: ' + ansiiprint.end() + '{}'.format(' '.join(domain_list)))

    for domain in domain_list:
        if domain not in s_domain:
            s_domain[domain] = VMInstance.VMInstance(domain, zk, t_node[myhostname])

    # Refresh the nodes once, after all new domains have been registered
    for node in node_list:
        if node in t_node:
            t_node[node].updatedomainlist(s_domain)
2018-05-31 20:26:44 -04:00
# Bind the update function of this host's node object.
# NOTE(review): this relies on t_node already holding an entry for this
# host by the time this line runs - confirm the /nodes watcher guarantees it.
this_node = t_node[myhostname]
update_zookeeper = this_node.update_zookeeper

# Background scheduler that calls update_zookeeper every 5 seconds
update_timer = apscheduler.schedulers.background.BackgroundScheduler()
update_timer.add_job(update_zookeeper, trigger='interval', seconds=5)
update_timer.start()
2018-06-04 02:22:59 -04:00
# Tick loop: keep the main thread alive while the scheduler and the Zookeeper
# watchers do the work. Ctrl-C or an exit request ends the loop and falls off
# the end of the script, which triggers the atexit cleanup handler.
while True:
    try:
        time.sleep(0.1)
    except (KeyboardInterrupt, SystemExit):
        # Name the expected interruptions instead of using a bare except
        break