main.py 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372
  1. from modelverse_state import status
  2. import sys
  3. from collections import defaultdict
  4. import os
  5. import cPickle as pickle
  6. # Work around Python 2 where a 'big integer' automatically becomes a long
  7. if sys.version > '3': # pragma: no cover
  8. integer_types = (int,)
  9. primitive_types = (int, float, str, bool)
  10. else: # pragma: no cover
  11. integer_types = (int, long)
  12. primitive_types = (int, long, float, str, bool, unicode)
  13. complex_primitives = frozenset(["if", "while", "assign", "call", "break", "continue", "return","resolve","access", "constant", "input", "output", "declare", "global"])
  14. def instance_to_string(value):
  15. return value["value"]
  16. def string_to_instance(value):
  17. return {'value': value}
  18. class ModelverseState(object):
  19. def __init__(self, bootfile = None):
  20. self.free_id = 0
  21. self.edges = {}
  22. self.outgoing = defaultdict(set)
  23. self.incoming = defaultdict(set)
  24. self.values = {}
  25. self.nodes = set()
  26. self.GC = True
  27. self.to_delete = set()
  28. self.cache = {}
  29. if bootfile is not None:
  30. self.root = self.parse(bootfile)
  31. else:
  32. self.root, _ = self.create_node()
  33. def dump_modelverse(self):
  34. with open("/tmp/modelverse.out", "w") as f:
  35. f.write("digraph main {\n")
  36. for n in self.nodes:
  37. if n in self.values:
  38. f.write("a_%s [label=\"a_%s (%s)\"];\n" % (n, n, self.values[n]))
  39. else:
  40. f.write("a_%s [label=\"a_%s\"];\n" % (n, n))
  41. for i, e in self.edges.iteritems():
  42. f.write("%s -> %s [label=\"%s\"];\n" % (e[0], e[1], i))
  43. f.write("}")
  44. return (self.root, status.SUCCESS)
  45. def parse(self, filename):
  46. picklefile = filename + ".pickle"
  47. try:
  48. if os.path.getmtime(picklefile) > os.path.getmtime(filename):
  49. # Pickle is more recent than grammarfile, so we can use it
  50. self.root, self.free_id, self.nodes, self.edges, self.values = pickle.load(open(picklefile, 'rb'))
  51. for name in self.edges:
  52. source, destination = self.edges[name]
  53. self.outgoing[source].add(name)
  54. self.incoming[destination].add(name)
  55. return self.root
  56. else:
  57. raise Exception("Invalid pickle")
  58. except Exception as e:
  59. # We have to parse the file and create the pickle
  60. symbols = {}
  61. def resolve(symb):
  62. try:
  63. return int(symb)
  64. except:
  65. if symb[0] == "?":
  66. derefs = symb[1:].split("/")
  67. v, _ = self.read_dict(symbols["root"], "__hierarchy")
  68. for deref in derefs:
  69. v, _ = self.read_dict(v, deref)
  70. return v
  71. else:
  72. return symbols[symb]
  73. with open(filename, 'r') as f:
  74. for line in f:
  75. element_type, constructor = line.split(None, 1)
  76. name, values = constructor.split("(", 1)
  77. name = name.split()[0]
  78. values, _ = values.rsplit(")", 1)
  79. if element_type == "Node":
  80. if values == "":
  81. symbols[name], status = self.create_node()
  82. else:
  83. value = values
  84. if value in complex_primitives:
  85. value = string_to_instance(value)
  86. else:
  87. value = eval(value)
  88. symbols[name], status = self.create_nodevalue(value)
  89. elif element_type == "Edge":
  90. values = [v.split()[0] for v in values.split(",")]
  91. symbols[name], status = self.create_edge(resolve(values[0]), resolve(values[1]))
  92. else:
  93. raise Exception("Unknown element type: %s" % element_type)
  94. if status != 100:
  95. raise Exception("Failed to process line for reason %s: %s" % (status, line))
  96. # Creation successful, now also create a pickle
  97. with open(picklefile, 'wb') as f:
  98. pickle.dump((symbols["root"], self.free_id, self.nodes, self.edges, self.values), f, pickle.HIGHEST_PROTOCOL)
  99. return symbols["root"]
  100. def read_root(self):
  101. return (self.root, status.SUCCESS)
  102. def create_node(self):
  103. self.nodes.add(self.free_id)
  104. self.free_id += 1
  105. return (self.free_id - 1, status.SUCCESS)
  106. def create_edge(self, source, target):
  107. if source not in self.edges and source not in self.nodes:
  108. return (None, status.FAIL_CE_SOURCE)
  109. elif target not in self.edges and target not in self.nodes:
  110. return (None, status.FAIL_CE_TARGET)
  111. else:
  112. self.outgoing[source].add(self.free_id)
  113. self.incoming[target].add(self.free_id)
  114. self.edges[self.free_id] = (source, target)
  115. self.free_id += 1
  116. return (self.free_id - 1, status.SUCCESS)
  117. def is_valid_datavalue(self, value):
  118. if isinstance(value, dict):
  119. if "value" in value and value["value"] in complex_primitives:
  120. return True
  121. else:
  122. return False
  123. elif not isinstance(value, primitive_types):
  124. return False
  125. return True
  126. def create_nodevalue(self, value):
  127. if not self.is_valid_datavalue(value):
  128. print("Not correct: " + str(value))
  129. return (None, status.FAIL_CNV_OOB)
  130. self.values[self.free_id] = value
  131. self.nodes.add(self.free_id)
  132. self.free_id += 1
  133. return (self.free_id - 1, status.SUCCESS)
  134. def create_dict(self, source, data, destination):
  135. if source not in self.nodes and source not in self.edges:
  136. return (None, status.FAIL_CDICT_SOURCE)
  137. if destination not in self.nodes and destination not in self.edges:
  138. return (None, status.FAIL_CDICT_TARGET)
  139. if not self.is_valid_datavalue(data):
  140. return (None, status.FAIL_CDICT_OOB)
  141. n = self.create_nodevalue(data)[0]
  142. e = self.create_edge(source, destination)[0]
  143. self.create_edge(e, n)
  144. self.cache.setdefault(source, {})[data] = e
  145. return (None, status.SUCCESS)
  146. def read_value(self, node):
  147. if node not in self.nodes:
  148. return (None, status.FAIL_RV_UNKNOWN)
  149. v = self.values.get(node, None)
  150. if v is None:
  151. return (None, status.FAIL_RV_NO_VALUE)
  152. else:
  153. return (v, status.SUCCESS)
  154. def read_outgoing(self, elem):
  155. if elem in self.edges or elem in self.nodes:
  156. return (list(self.outgoing[elem]), status.SUCCESS)
  157. else:
  158. return (None, status.FAIL_RO_UNKNOWN)
  159. def read_incoming(self, elem):
  160. if elem in self.edges or elem in self.nodes:
  161. return (list(self.incoming[elem]), status.SUCCESS)
  162. else:
  163. return (None, status.FAIL_RI_UNKNOWN)
  164. def read_edge(self, edge):
  165. v = self.edges.get(edge, None)
  166. if v is None:
  167. return ([None, None], status.FAIL_RE_UNKNOWN)
  168. else:
  169. s, t = v
  170. return ([s, t], status.SUCCESS)
  171. def read_dict(self, node, value):
  172. e, s = self.read_dict_edge(node, value)
  173. if s != status.SUCCESS:
  174. return (None, {status.FAIL_RDICTE_UNKNOWN: status.FAIL_RDICT_UNKNOWN,
  175. status.FAIL_RDICTE_UNCERTAIN: status.FAIL_RDICT_UNCERTAIN,
  176. status.FAIL_RDICTE_OOB: status.FAIL_RDICT_OOB,
  177. status.FAIL_RDICTE_NOT_FOUND: status.FAIL_RDICT_NOT_FOUND,
  178. status.FAIL_RDICTE_AMBIGUOUS: status.FAIL_RDICT_AMBIGUOUS}[s])
  179. return (self.edges[e][1], status.SUCCESS)
  180. def read_dict_keys(self, node):
  181. if node not in self.nodes and node not in self.edges:
  182. return (None, status.FAIL_RDICTKEYS_UNKNOWN)
  183. result = []
  184. for e1 in self.outgoing.get(node, set()):
  185. data_links = self.outgoing.get(e1, set())
  186. for e2 in data_links:
  187. result.append(self.edges[e2][1])
  188. return (result, status.SUCCESS)
  189. def read_dict_edge(self, node, value):
  190. try:
  191. first = self.cache[node][str(value)]
  192. # Got hit, so validate
  193. if (self.edges[first][0] == node) and \
  194. (len(self.outgoing[first]) == 1) and \
  195. (self.values[self.edges[list(self.outgoing[first])[0]][1]] == value):
  196. return (first, status.SUCCESS)
  197. del self.cache[node][value]
  198. except KeyError:
  199. # Didn't exist
  200. pass
  201. if node not in self.nodes and node not in self.edges:
  202. return (None, status.FAIL_RDICTE_UNKNOWN)
  203. if not self.is_valid_datavalue(value):
  204. return (None, status.FAIL_RDICTE_OOB)
  205. # Get all outgoing links
  206. found = None
  207. for e1 in self.outgoing.get(node, set()):
  208. data_links = self.outgoing.get(e1, set())
  209. # For each link, we read the links that might link to a data value
  210. for e2 in data_links:
  211. # Now read out the target of the link
  212. target = self.edges[e2][1]
  213. # And access its value
  214. v = self.values.get(target, None)
  215. if v == value:
  216. # Found a match
  217. # Now get the target of the original link
  218. if found is not None:
  219. print("Duplicate key on value: %s (%s <-> %s)!" % (v, found, e1))
  220. return (None, status.FAIL_RDICTE_AMBIGUOUS)
  221. found = e1
  222. self.cache.setdefault(node, {})[value] = e1
  223. if found is not None:
  224. return (found, status.SUCCESS)
  225. else:
  226. return (None, status.FAIL_RDICTE_NOT_FOUND)
  227. def read_dict_node(self, node, value_node):
  228. e, s = self.read_dict_node_edge(node, value_node)
  229. if s != status.SUCCESS:
  230. return (None, {status.FAIL_RDICTNE_UNKNOWN: status.FAIL_RDICTN_UNKNOWN,
  231. status.FAIL_RDICTNE_UNCERTAIN: status.FAIL_RDICTN_UNCERTAIN,
  232. status.FAIL_RDICTNE_AMBIGUOUS: status.FAIL_RDICTN_AMBIGUOUS,
  233. status.FAIL_RDICTNE_OOB: status.FAIL_RDICTN_OOB,
  234. status.FAIL_RDICTNE_NOT_FOUND: status.FAIL_RDICTN_NOT_FOUND}[s])
  235. return (self.edges[e][1], status.SUCCESS)
  236. def read_dict_node_edge(self, node, value_node):
  237. if node not in self.nodes and node not in self.edges:
  238. return (None, status.FAIL_RDICTNE_UNKNOWN)
  239. # Get all outgoing links
  240. found = None
  241. for e1 in self.outgoing.get(node, set()):
  242. data_links = self.outgoing.get(e1, set())
  243. # For each link, we read the links that might link to a data value
  244. for e2 in data_links:
  245. # Now read out the target of the link
  246. target = self.edges[e2][1]
  247. # And access its value
  248. if target == value_node:
  249. # Found a match
  250. # Now get the target of the original link
  251. if found is not None:
  252. print("Duplicate key on node: %s (%s <-> %s)!" % (value_node, found, e1))
  253. return (None, status.FAIL_RDICTNE_AMBIGUOUS)
  254. found = e1
  255. if found is not None:
  256. return (found, status.SUCCESS)
  257. else:
  258. return (None, status.FAIL_RDICTNE_NOT_FOUND)
  259. def read_reverse_dict(self, node, value):
  260. if node not in self.nodes and node not in self.edges:
  261. return (None, status.FAIL_RRDICT_UNKNOWN)
  262. elif not self.is_valid_datavalue(value):
  263. return (None, status.FAIL_RRDICT_OOB)
  264. # Get all outgoing links
  265. matches = []
  266. for e1 in self.incoming.get(node, set()):
  267. data_links = self.outgoing.get(e1, set())
  268. # For each link, we read the links that might link to a data value
  269. for e2 in data_links:
  270. # Now read out the target of the link
  271. target = self.edges[e2][1]
  272. # And access its value
  273. v = self.values.get(target, None)
  274. if v == value:
  275. # Found a match
  276. if len(data_links) > 1:
  277. return (None, status.FAIL_RRDICT_UNCERTAIN)
  278. else:
  279. matches.append(e1)
  280. if len(matches) == 0:
  281. return (None, status.FAIL_RRDICT_NOT_FOUND)
  282. else:
  283. return ([self.edges[e][0] for e in matches], status.SUCCESS)
  284. def delete_node(self, node):
  285. if node is self.root:
  286. return (None, status.FAIL_DN_UNKNOWN)
  287. if node not in self.nodes:
  288. return (None, status.FAIL_DN_UNKNOWN)
  289. self.nodes.remove(node)
  290. if node in self.values:
  291. del self.values[node]
  292. s = set()
  293. for e in self.outgoing[node]:
  294. s.add(e)
  295. for e in self.incoming[node]:
  296. s.add(e)
  297. for e in s:
  298. self.delete_edge(e)
  299. del self.outgoing[node]
  300. del self.incoming[node]
  301. return (None, status.SUCCESS)
  302. def delete_edge(self, edge):
  303. if edge not in self.edges:
  304. return (None, status.FAIL_DE_UNKNOWN)
  305. s, t = self.edges[edge]
  306. self.incoming[t].remove(edge)
  307. self.outgoing[s].remove(edge)
  308. del self.edges[edge]
  309. s = set()
  310. for e in self.outgoing[edge]:
  311. s.add(e)
  312. for e in self.incoming[edge]:
  313. s.add(e)
  314. for e in s:
  315. self.delete_edge(e)
  316. del self.outgoing[edge]
  317. del self.incoming[edge]
  318. if (self.GC) and (not self.incoming[t]) and (t not in self.edges):
  319. # Remove this node as well
  320. # Edges aren't deleted like this, as they might have a reachable target and source!
  321. # If they haven't, they will be removed because the source was removed.
  322. self.to_delete.add(t)
  323. return (None, status.SUCCESS)
  324. def garbage_collect(self):
  325. while self.to_delete:
  326. self.delete_node(self.to_delete.pop())