sysvitals_api.py 10.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320
  1. #!/usr/bin/env python
  2. import gevent.monkey
  3. gevent.monkey.patch_all(thread=False)
  4. from collections import defaultdict
  5. import copy
  6. import datetime
  7. import errno
  8. import httplib
  9. import json
  10. import os
  11. from os import path
  12. import traceback
  13. import urlparse
  14. import gevent.pywsgi
  15. import config
  16. import db
  17. import fileio
  18. import reloader
# Root directory for stored stats. get_raw and post_datum read/write files at
# DATA_DIR/<group_id>/<server_id>/<YYYY-MM-DD>.
DATA_DIR = path.expanduser('~/sysvitals_data')
# Route name -> handler callable. Stays None until main() fills it in;
# application() looks handlers up here on every request.
handlers = None
  21. def main():
  22. global handlers
  23. handlers = {
  24. 'datum': post_datum,
  25. 'raw': get_raw,
  26. 'stats': get_stats,
  27. 'servers': get_servers,
  28. 'register_server': register_server,
  29. }
  30. server = gevent.pywsgi.WSGIServer(('0.0.0.0', config.api_port), application)
  31. if config.debug:
  32. reloader.init(server)
  33. print 'listening on', config.api_port
  34. server.serve_forever()
  35. class HTTPException(Exception):
  36. def __init__(self, code, body):
  37. self.code = code
  38. self.body = body
# CORS headers included in every response built by application().
BASE_HEADERS = [
    ('Access-Control-Allow-Origin', '*'),
    ('Access-Control-Allow-Headers', 'Authorization, X-Requested-With, X-Request'),
]
# Used for 200 responses (including OPTIONS); handler results are JSON-encoded.
DEFAULT_HEADERS = BASE_HEADERS + [('Content-type', 'application/json')]
# Used for error responses, whose bodies are plain text.
ERROR_HEADERS = BASE_HEADERS + [('Content-type', 'text/plain')]
  45. def application(environ, start_response):
  46. try:
  47. if environ['REQUEST_METHOD'] == 'OPTIONS':
  48. start_response('200 OK', copy.copy(DEFAULT_HEADERS))
  49. return []
  50. split = environ['PATH_INFO'][1:].split('/')
  51. qs = environ['QUERY_STRING']
  52. if qs:
  53. query = urlparse.parse_qs(qs, True, True)
  54. for k, v in query.iteritems():
  55. if len(v) > 1:
  56. raise HTTPException(400, 'duplicate query parameter: ' + k)
  57. query[k] = v[0]
  58. else:
  59. query = {}
  60. if split[0] == 'v1':
  61. handler = handlers.get(split[2])
  62. if handler:
  63. body = json.dumps(handler(split, query, environ))
  64. start_response('200 OK', copy.copy(DEFAULT_HEADERS))
  65. return [body]
  66. else:
  67. print 'no handler for', split
  68. else:
  69. print 'split was', split
  70. raise HTTPException(404, 'unhandled path: ' + environ['PATH_INFO'])
  71. except HTTPException as e:
  72. response = '%d %s' % (e.code, httplib.responses[e.code])
  73. start_response(response, copy.copy(ERROR_HEADERS))
  74. return [e.body]
  75. except:
  76. traceback.print_exc()
  77. start_response('500 Internal Server Error', copy.copy(ERROR_HEADERS))
  78. return ['ruh roh']
  79. def get_raw(split, query, environ):
  80. try:
  81. group_id = get_group(split, environ)
  82. server_id = int(split[3])
  83. start = datetime.datetime.strptime(query['start'], '%Y-%m-%d').date()
  84. end = datetime.datetime.strptime(query['end'], '%Y-%m-%d').date()
  85. except (IndexError, KeyError, ValueError):
  86. raise HTTPException(400, '')
  87. server_dir = path.join(DATA_DIR, str(group_id), str(server_id))
  88. rval = {}
  89. c = start
  90. while c <= end:
  91. date_str = c.isoformat()
  92. try:
  93. with open(path.join(server_dir, date_str), 'r') as f:
  94. data = fileio.read_stats(f)
  95. except IOError as e:
  96. if e.errno == errno.ENOENT:
  97. data = None
  98. else:
  99. raise
  100. rval[date_str] = data
  101. c += datetime.timedelta(days=1)
  102. return rval
# Subfield names get_stats emits for each field when a day has no stored data
# (each is filled with None placeholders). 'disk' has no entry here.
fields = {
    'cpu': ['user', 'iowait', 'system', 'nice', 'guest', 'guest_nice', 'irq', 'softirq', 'steal', 'idle'],
    'mem': ['used', 'buffers', 'cached', 'free'],
    'net': ['bit/s_in', 'bit/s_out', 'err_in', 'err_out', 'drop_in', 'drop_out'],
}
  108. def get_stats(split, query, environ):
  109. try:
  110. interval = int(query.get('interval', 1))
  111. except ValueError:
  112. raise HTTPException(400, 'interval must be integer')
  113. raw = get_raw(split, query, environ)
  114. dates = raw.keys()
  115. dates.sort()
  116. last_val = fileio.gen_template(-1)
  117. stats = defaultdict(dict)
  118. for date in dates:
  119. data = raw[date]
  120. if data is None:
  121. for field, subfields in fields.iteritems():
  122. for subfield in subfields:
  123. stats[field].setdefault(subfield, {})
  124. stats[field][subfield][date] = [None] * (1440 / interval)
  125. continue
  126. for field, subfields in data.items():
  127. if field == 'cpu':
  128. field_data = {}
  129. # subtract times from last minute, calculate total time spent each minute
  130. sums = [0] * 1440
  131. for subfield, raw_array in subfields.iteritems():
  132. if subfield != 'num_cpus':
  133. array = [None] * 1440
  134. for i, d in enumerate(raw_array):
  135. lv = last_val[field][subfield]
  136. if d > 0 and lv > 0:
  137. array[i] = d - lv
  138. sums[i] += array[i]
  139. last_val[field][subfield] = d
  140. field_data[subfield] = array
  141. # divide differences by total times
  142. for subfield, array in field_data.items():
  143. if subfield != 'num_cpus':
  144. for i, d in enumerate(array):
  145. if d > 0:
  146. array[i] = array[i] * subfields['num_cpus'][i] * 100 / sums[i]
  147. stats[field].setdefault(subfield, {})
  148. stats[field][subfield][date] = average(array, interval)
  149. elif field == 'mem':
  150. # translate total to free, subtract buffers and cached from used
  151. field_data = {}
  152. new_fields = ['used', 'buffers', 'cached', 'free']
  153. for subfield in new_fields:
  154. field_data[subfield] = [None] * 1440
  155. for i in xrange(1440):
  156. if subfields['total'][i] == -1:
  157. for nf in new_fields:
  158. field_data[nf][i] = None
  159. continue
  160. field_data['free'][i] = subfields['total'][i] - subfields['used'][i]
  161. field_data['used'][i] = subfields['used'][i] - subfields['buffers'][i] - subfields['cached'][i]
  162. field_data['buffers'][i] = subfields['buffers'][i]
  163. field_data['cached'][i] = subfields['cached'][i]
  164. for subfield, array in field_data.iteritems():
  165. stats[field].setdefault(subfield, {})
  166. stats[field][subfield][date] = average(array, interval)
  167. elif field == 'net':
  168. field_data = {}
  169. for subfield in ['bit/s_in', 'bit/s_out', 'err_in', 'err_out', 'drop_in', 'drop_out']:
  170. field_data[subfield] = [None] * 1440
  171. for i in xrange(1440):
  172. lv_recv = last_val['net']['bytes_recv']
  173. lv_sent = last_val['net']['bytes_sent']
  174. if lv_recv > 0:
  175. field_data['bit/s_in'][i] = (subfields['bytes_recv'][i] - lv_recv) * 8.0 / 60
  176. if lv_sent > 0:
  177. field_data['bit/s_out'][i] = (subfields['bytes_sent'][i] - lv_sent) * 8.0 / 60
  178. last_val['net']['bytes_recv'] = subfields['bytes_recv'][i]
  179. last_val['net']['bytes_sent'] = subfields['bytes_sent'][i]
  180. for subfield in ['err_in', 'err_out', 'drop_in', 'drop_out']:
  181. field_data[subfield][i] = subfields[subfield.replace('_', '')][i]
  182. for subfield, array in field_data.iteritems():
  183. stats[field].setdefault(subfield, {})
  184. stats[field][subfield][date] = average(array, interval)
  185. elif field == 'disk':
  186. field_data = {}
  187. for mountpoint, disk_sfs in subfields.items():
  188. used_key = mountpoint + '_used'
  189. free_key = mountpoint + '_free'
  190. field_data[used_key] = [None] * 1440
  191. field_data[free_key] = [None] * 1440
  192. for i in xrange(1440):
  193. if disk_sfs['total'][i] == -1:
  194. continue
  195. used = disk_sfs['used'][i]
  196. field_data[used_key][i] = used
  197. field_data[free_key][i] = disk_sfs['total'][i] - used
  198. for subfield, array in field_data.iteritems():
  199. stats[field].setdefault(subfield, {})
  200. stats[field][subfield][date] = average(array, interval)
  201. return stats
  202. def post_datum(split, query, environ):
  203. group_id = get_group(split, environ)
  204. try:
  205. server_id = int(split[3])
  206. except (IndexError, ValueError):
  207. raise HTTPException(400, '')
  208. body = load_json_body(environ)
  209. if body.keys() != fileio.TEMPLATE.keys():
  210. diff = set(body.keys()).symmetric_difference(set(fileio.TEMPLATE.keys()))
  211. raise HTTPException(400, 'post body had missing or extra keys: ' + ','.join(diff))
  212. server_dir = path.join(DATA_DIR, str(group_id), str(server_id))
  213. try:
  214. os.makedirs(server_dir)
  215. except OSError as e:
  216. if e.errno != errno.EEXIST:
  217. raise
  218. # we floor to the minute, so this rounds to the nearest minute
  219. now = datetime.datetime.utcnow() + datetime.timedelta(seconds=29)
  220. data_path = path.join(server_dir, now.date().isoformat())
  221. try:
  222. with open(data_path, 'r') as f:
  223. stats = fileio.read_stats(f)
  224. except IOError as e:
  225. if e.errno != errno.ENOENT:
  226. raise
  227. stats = copy.deepcopy(fileio.TEMPLATE)
  228. index = now.hour * 60 + now.minute
  229. data = {}
  230. for field, subfields in stats.iteritems():
  231. field_data = {}
  232. if field == 'disk':
  233. disk = stats['disk']
  234. for mountpoint, datum in body['disk'].iteritems(): # iterate through body to get new mountpoints
  235. disk.setdefault(mountpoint, {'total': [-1] * 1440, 'used': [-1] * 1440})
  236. field_data[mountpoint] = {}
  237. for subfield, array in disk[mountpoint].iteritems():
  238. array = list(array)
  239. array[index] = datum[subfield]
  240. field_data[mountpoint][subfield] = array
  241. else:
  242. for subfield, array in subfields.iteritems():
  243. array = list(array)
  244. array[index] = body[field][subfield]
  245. field_data[subfield] = array
  246. data[field] = field_data
  247. with open(data_path, 'w') as f:
  248. fileio.write_datum(f, data)
  249. return {'status': 'ok'}
  250. def get_servers(split, query, environ):
  251. group_id = get_group(split, environ)
  252. return db.get_servers(group_id)
  253. def register_server(split, query, environ):
  254. group_id = get_group(split, environ)
  255. body = load_json_body(environ)
  256. try:
  257. hostname = body['hostname']
  258. except KeyError:
  259. raise HTTPException(400, 'post body didn\'t contain "hostname" key')
  260. server_id = db.create_server(group_id, hostname)
  261. return {'server_id': server_id}
  262. def get_group(split, environ):
  263. try:
  264. group_id = int(split[1])
  265. except (IndexError, ValueError):
  266. raise HTTPException(400, '/v1/[group_id] - group_id was not valid int')
  267. if 'HTTP_AUTHORIZATION' not in environ:
  268. raise HTTPException(401, 'no api key passed in Authorization header')
  269. if db.get_api_key(group_id) != environ['HTTP_AUTHORIZATION']:
  270. raise HTTPException(403, 'api key did not match')
  271. return group_id
  272. def load_json_body(environ):
  273. try:
  274. body = json.load(environ['wsgi.input'])
  275. except ValueError:
  276. raise HTTPException(400, 'post body was not valid JSON')
  277. if not isinstance(body, dict):
  278. raise HTTPException(400, 'post body was not a JSON dictionary')
  279. return body
  280. def average(array, interval):
  281. if interval == 1:
  282. return array
  283. averaged = []
  284. accum = num_values = 0
  285. for i, v in enumerate(array):
  286. if v is not None:
  287. accum += v
  288. num_values += 1
  289. if (i + 1) % interval == 0:
  290. if num_values > 0:
  291. averaged.append(accum / num_values)
  292. else:
  293. averaged.append(None)
  294. accum = num_values = 0
  295. return averaged
# Runs whenever this module is executed or imported (there is no __name__
# guard); main() then blocks in serve_forever().
main()