paul@0 | 1 | #!/usr/bin/env python |
paul@0 | 2 | |
paul@0 | 3 | """ |
paul@0 | 4 | Import logic. |
paul@0 | 5 | |
paul@0 | 6 | Copyright (C) 2006, 2007, 2008, 2009, 2010, 2011, 2012, 2013, |
paul@0 | 7 | 2014, 2015, 2016 Paul Boddie <paul@boddie.org.uk> |
paul@0 | 8 | |
paul@0 | 9 | This program is free software; you can redistribute it and/or modify it under |
paul@0 | 10 | the terms of the GNU General Public License as published by the Free Software |
paul@0 | 11 | Foundation; either version 3 of the License, or (at your option) any later |
paul@0 | 12 | version. |
paul@0 | 13 | |
paul@0 | 14 | This program is distributed in the hope that it will be useful, but WITHOUT |
paul@0 | 15 | ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS |
paul@0 | 16 | FOR A PARTICULAR PURPOSE. See the GNU General Public License for more |
paul@0 | 17 | details. |
paul@0 | 18 | |
paul@0 | 19 | You should have received a copy of the GNU General Public License along with |
paul@0 | 20 | this program. If not, see <http://www.gnu.org/licenses/>. |
paul@0 | 21 | """ |
paul@0 | 22 | |
paul@0 | 23 | from errors import ProgramError |
paul@0 | 24 | from os.path import exists, extsep, getmtime, join |
paul@0 | 25 | from os import listdir, makedirs, remove |
paul@0 | 26 | from common import init_item, readfile, writefile |
paul@13 | 27 | from modules import CachedModule |
paul@0 | 28 | from referencing import Reference |
paul@0 | 29 | import inspector |
paul@0 | 30 | import sys |
paul@0 | 31 | |
paul@0 | 32 | class Importer: |
paul@0 | 33 | |
paul@0 | 34 | "An import machine, searching for and loading modules." |
paul@0 | 35 | |
paul@0 | 36 | def __init__(self, path, cache=None, verbose=False): |
paul@0 | 37 | |
paul@0 | 38 | """ |
paul@0 | 39 | Initialise the importer with the given search 'path' - a list of |
paul@0 | 40 | directories to search for Python modules. |
paul@0 | 41 | |
paul@0 | 42 | The optional 'cache' should be the name of a directory used to store |
paul@0 | 43 | cached module information. |
paul@0 | 44 | |
paul@0 | 45 | The optional 'verbose' parameter causes output concerning the activities |
paul@0 | 46 | of the object to be produced if set to a true value (not the default). |
paul@0 | 47 | """ |
paul@0 | 48 | |
paul@0 | 49 | self.path = path |
paul@0 | 50 | self.cache = cache |
paul@0 | 51 | self.verbose = verbose |
paul@0 | 52 | |
paul@41 | 53 | # Module importing queue, required modules, removed modules and active |
paul@41 | 54 | # modules in the final program. |
paul@41 | 55 | |
paul@12 | 56 | self.to_import = set() |
paul@16 | 57 | self.required = set(["__main__"]) |
paul@24 | 58 | self.removed = {} |
paul@41 | 59 | self.modules = {} |
paul@12 | 60 | |
paul@41 | 61 | # Module relationships and invalidated cached modules. |
paul@41 | 62 | |
paul@12 | 63 | self.accessing_modules = {} |
paul@0 | 64 | self.invalidated = set() |
paul@0 | 65 | |
paul@41 | 66 | # Basic program information. |
paul@41 | 67 | |
paul@0 | 68 | self.objects = {} |
paul@0 | 69 | self.classes = {} |
paul@0 | 70 | self.function_parameters = {} |
paul@0 | 71 | self.function_defaults = {} |
paul@109 | 72 | self.function_locals = {} |
paul@0 | 73 | self.function_targets = {} |
paul@0 | 74 | self.function_arguments = {} |
paul@0 | 75 | |
paul@41 | 76 | # Unresolved names. |
paul@41 | 77 | |
paul@41 | 78 | self.missing = set() |
paul@41 | 79 | |
paul@0 | 80 | # Derived information. |
paul@0 | 81 | |
paul@0 | 82 | self.subclasses = {} |
paul@0 | 83 | |
paul@0 | 84 | # Attributes of different object types. |
paul@0 | 85 | |
paul@0 | 86 | self.all_class_attrs = {} |
paul@0 | 87 | self.all_instance_attrs = {} |
paul@0 | 88 | self.all_instance_attr_constants = {} |
paul@0 | 89 | self.all_combined_attrs = {} |
paul@0 | 90 | self.all_module_attrs = {} |
paul@0 | 91 | self.all_shadowed_attrs = {} |
paul@0 | 92 | |
paul@0 | 93 | # References to external names and aliases within program units. |
paul@0 | 94 | |
paul@0 | 95 | self.all_name_references = {} |
paul@0 | 96 | self.all_initialised_names = {} |
paul@0 | 97 | self.all_aliased_names = {} |
paul@0 | 98 | |
paul@0 | 99 | # General attribute accesses. |
paul@0 | 100 | |
paul@0 | 101 | self.all_attr_accesses = {} |
paul@0 | 102 | self.all_const_accesses = {} |
paul@0 | 103 | self.all_attr_access_modifiers = {} |
paul@0 | 104 | |
paul@0 | 105 | # Constant literals and values. |
paul@0 | 106 | |
paul@0 | 107 | self.all_constants = {} |
paul@0 | 108 | self.all_constant_values = {} |
paul@0 | 109 | |
paul@0 | 110 | self.make_cache() |
paul@0 | 111 | |
paul@0 | 112 | def make_cache(self): |
paul@0 | 113 | if self.cache and not exists(self.cache): |
paul@0 | 114 | makedirs(self.cache) |
paul@0 | 115 | |
paul@0 | 116 | def check_cache(self, details): |
paul@0 | 117 | |
paul@0 | 118 | """ |
paul@0 | 119 | Check whether the cache applies for the given 'details', invalidating it |
paul@0 | 120 | if it does not. |
paul@0 | 121 | """ |
paul@0 | 122 | |
paul@0 | 123 | recorded_details = self.get_cache_details() |
paul@0 | 124 | |
paul@0 | 125 | if recorded_details != details: |
paul@0 | 126 | self.remove_cache() |
paul@0 | 127 | |
paul@0 | 128 | writefile(self.get_cache_details_filename(), details) |
paul@0 | 129 | |
paul@0 | 130 | def get_cache_details_filename(self): |
paul@0 | 131 | |
paul@0 | 132 | "Return the filename for the cache details." |
paul@0 | 133 | |
paul@0 | 134 | return join(self.cache, "$details") |
paul@0 | 135 | |
paul@0 | 136 | def get_cache_details(self): |
paul@0 | 137 | |
paul@0 | 138 | "Return details of the cache." |
paul@0 | 139 | |
paul@0 | 140 | details_filename = self.get_cache_details_filename() |
paul@0 | 141 | |
paul@0 | 142 | if not exists(details_filename): |
paul@0 | 143 | return None |
paul@0 | 144 | else: |
paul@0 | 145 | return readfile(details_filename) |
paul@0 | 146 | |
paul@0 | 147 | def remove_cache(self): |
paul@0 | 148 | |
paul@0 | 149 | "Remove the contents of the cache." |
paul@0 | 150 | |
paul@0 | 151 | for filename in listdir(self.cache): |
paul@0 | 152 | remove(join(self.cache, filename)) |
paul@0 | 153 | |
paul@0 | 154 | def to_cache(self): |
paul@0 | 155 | |
paul@0 | 156 | "Write modules to the cache." |
paul@0 | 157 | |
paul@0 | 158 | if self.cache: |
paul@0 | 159 | for module_name, module in self.modules.items(): |
paul@0 | 160 | module.to_cache(join(self.cache, module_name)) |
paul@0 | 161 | |
paul@0 | 162 | # Object retrieval and storage. |
paul@0 | 163 | |
paul@0 | 164 | def get_object(self, name): |
paul@0 | 165 | |
paul@0 | 166 | """ |
paul@0 | 167 | Return a reference for the given 'name' or None if no such object |
paul@0 | 168 | exists. |
paul@0 | 169 | """ |
paul@0 | 170 | |
paul@0 | 171 | return self.objects.get(name) |
paul@0 | 172 | |
paul@0 | 173 | def set_object(self, name, value=None): |
paul@0 | 174 | |
paul@0 | 175 | "Set the object with the given 'name' and the given 'value'." |
paul@0 | 176 | |
paul@0 | 177 | if isinstance(value, Reference): |
paul@0 | 178 | ref = value.alias(name) |
paul@0 | 179 | else: |
paul@0 | 180 | ref = Reference(value, name) |
paul@0 | 181 | |
paul@0 | 182 | self.objects[name] = ref |
paul@0 | 183 | |
paul@27 | 184 | # Identification of both stored object names and name references. |
paul@27 | 185 | |
paul@27 | 186 | def identify(self, name): |
paul@27 | 187 | |
paul@27 | 188 | "Identify 'name' using stored object and external name records." |
paul@27 | 189 | |
paul@177 | 190 | ref = self.objects.get(name) |
paul@177 | 191 | if not ref or ref.has_kind("<module>"): |
paul@177 | 192 | ref = self.all_name_references.get(name) or ref |
paul@177 | 193 | return ref |
paul@27 | 194 | |
paul@0 | 195 | # Indirect object retrieval. |
paul@0 | 196 | |
paul@0 | 197 | def get_attributes(self, ref, attrname): |
paul@0 | 198 | |
paul@0 | 199 | """ |
paul@0 | 200 | Return attributes provided by 'ref' for 'attrname'. Class attributes |
paul@0 | 201 | may be provided by instances. |
paul@0 | 202 | """ |
paul@0 | 203 | |
paul@0 | 204 | kind = ref.get_kind() |
paul@0 | 205 | if kind == "<class>": |
paul@0 | 206 | ref = self.get_class_attribute(ref.get_origin(), attrname) |
paul@0 | 207 | return ref and set([ref]) or set() |
paul@0 | 208 | elif kind == "<instance>": |
paul@0 | 209 | return self.get_combined_attributes(ref.get_origin(), attrname) |
paul@0 | 210 | elif kind == "<module>": |
paul@0 | 211 | ref = self.get_module_attribute(ref.get_origin(), attrname) |
paul@0 | 212 | return ref and set([ref]) or set() |
paul@0 | 213 | else: |
paul@0 | 214 | return set() |
paul@0 | 215 | |
paul@0 | 216 | def get_class_attribute(self, object_type, attrname): |
paul@0 | 217 | |
paul@0 | 218 | "Return from 'object_type' the details of class attribute 'attrname'." |
paul@0 | 219 | |
paul@0 | 220 | attr = self.all_class_attrs[object_type].get(attrname) |
paul@0 | 221 | return attr and self.get_object(attr) |
paul@0 | 222 | |
paul@0 | 223 | def get_instance_attributes(self, object_type, attrname): |
paul@0 | 224 | |
paul@0 | 225 | """ |
paul@0 | 226 | Return from 'object_type' the details of instance attribute 'attrname'. |
paul@0 | 227 | """ |
paul@0 | 228 | |
paul@0 | 229 | consts = self.all_instance_attr_constants.get(object_type) |
paul@0 | 230 | attrs = set() |
paul@0 | 231 | for attr in self.all_instance_attrs[object_type].get(attrname, []): |
paul@0 | 232 | attrs.add(consts and consts.get(attrname) or Reference("<var>", attr)) |
paul@0 | 233 | return attrs |
paul@0 | 234 | |
paul@0 | 235 | def get_combined_attributes(self, object_type, attrname): |
paul@0 | 236 | |
paul@0 | 237 | """ |
paul@0 | 238 | Return from 'object_type' the details of class or instance attribute |
paul@0 | 239 | 'attrname'. |
paul@0 | 240 | """ |
paul@0 | 241 | |
paul@0 | 242 | ref = self.get_class_attribute(object_type, attrname) |
paul@0 | 243 | refs = ref and set([ref]) or set() |
paul@0 | 244 | refs.update(self.get_instance_attributes(object_type, attrname)) |
paul@0 | 245 | return refs |
paul@0 | 246 | |
paul@0 | 247 | def get_module_attribute(self, object_type, attrname): |
paul@0 | 248 | |
paul@0 | 249 | "Return from 'object_type' the details of module attribute 'attrname'." |
paul@0 | 250 | |
paul@0 | 251 | if attrname in self.all_module_attrs[object_type]: |
paul@0 | 252 | return self.get_object("%s.%s" % (object_type, attrname)) |
paul@0 | 253 | else: |
paul@0 | 254 | return None |
paul@0 | 255 | |
paul@96 | 256 | # Convenience methods for deducing which kind of object provided an |
paul@96 | 257 | # attribute. |
paul@96 | 258 | |
paul@96 | 259 | def get_attribute_provider(self, ref, attrname): |
paul@96 | 260 | |
paul@96 | 261 | """ |
paul@96 | 262 | Return the kind of provider of the attribute accessed via 'ref' using |
paul@96 | 263 | 'attrname'. |
paul@96 | 264 | """ |
paul@96 | 265 | |
paul@96 | 266 | kind = ref.get_kind() |
paul@96 | 267 | |
paul@96 | 268 | if kind in ["<class>", "<module>"]: |
paul@96 | 269 | return kind |
paul@96 | 270 | else: |
paul@96 | 271 | return self.get_instance_attribute_provider(ref.get_origin(), attrname) |
paul@96 | 272 | |
paul@96 | 273 | def get_instance_attribute_provider(self, object_type, attrname): |
paul@96 | 274 | |
paul@96 | 275 | """ |
paul@96 | 276 | Return the kind of provider of the attribute accessed via an instance of |
paul@96 | 277 | 'object_type' using 'attrname'. |
paul@96 | 278 | """ |
paul@96 | 279 | |
paul@96 | 280 | if self.get_class_attribute(object_type, attrname): |
paul@96 | 281 | return "<class>" |
paul@96 | 282 | else: |
paul@96 | 283 | return "<instance>" |
paul@96 | 284 | |
paul@0 | 285 | # Module management. |
paul@0 | 286 | |
paul@16 | 287 | def queue_module(self, name, accessor, required=False): |
paul@12 | 288 | |
paul@12 | 289 | """ |
paul@12 | 290 | Queue the module with the given 'name' for import from the given |
paul@16 | 291 | 'accessor' module. If 'required' is true (it is false by default), the |
paul@16 | 292 | module will be required in the final program. |
paul@12 | 293 | """ |
paul@12 | 294 | |
paul@12 | 295 | if not self.modules.has_key(name): |
paul@12 | 296 | self.to_import.add(name) |
paul@12 | 297 | |
paul@16 | 298 | if required: |
paul@16 | 299 | self.required.add(name) |
paul@16 | 300 | |
paul@12 | 301 | init_item(self.accessing_modules, name, set) |
paul@16 | 302 | self.accessing_modules[name].add(accessor.name) |
paul@12 | 303 | |
paul@0 | 304 | def get_modules(self): |
paul@0 | 305 | |
paul@0 | 306 | "Return all modules known to the importer." |
paul@0 | 307 | |
paul@0 | 308 | return self.modules.values() |
paul@0 | 309 | |
paul@12 | 310 | def get_module(self, name): |
paul@0 | 311 | |
paul@0 | 312 | "Return the module with the given 'name'." |
paul@0 | 313 | |
paul@0 | 314 | if not self.modules.has_key(name): |
paul@0 | 315 | return None |
paul@0 | 316 | |
paul@12 | 317 | return self.modules[name] |
paul@0 | 318 | |
paul@0 | 319 | # Program operations. |
paul@0 | 320 | |
paul@0 | 321 | def initialise(self, filename, reset=False): |
paul@0 | 322 | |
paul@0 | 323 | """ |
paul@0 | 324 | Initialise a program whose main module is 'filename', resetting the |
paul@0 | 325 | cache if 'reset' is true. Return the main module. |
paul@0 | 326 | """ |
paul@0 | 327 | |
paul@0 | 328 | if reset: |
paul@0 | 329 | self.remove_cache() |
paul@0 | 330 | self.check_cache(filename) |
paul@0 | 331 | |
paul@0 | 332 | # Load the program itself. |
paul@0 | 333 | |
paul@0 | 334 | m = self.load_from_file(filename) |
paul@0 | 335 | |
paul@12 | 336 | # Load any queued modules. |
paul@12 | 337 | |
paul@12 | 338 | while self.to_import: |
paul@12 | 339 | for name in list(self.to_import): # avoid mutation issue |
paul@12 | 340 | self.load(name) |
paul@12 | 341 | |
paul@12 | 342 | # Resolve dependencies between modules. |
paul@12 | 343 | |
paul@12 | 344 | self.resolve() |
paul@12 | 345 | |
paul@16 | 346 | # Record the type of all classes. |
paul@16 | 347 | |
paul@177 | 348 | self.type_ref = self.get_object("__builtins__.core.type") |
paul@16 | 349 | |
paul@0 | 350 | # Resolve dependencies within the program. |
paul@0 | 351 | |
paul@12 | 352 | for module in self.modules.values(): |
paul@12 | 353 | module.complete() |
paul@0 | 354 | |
paul@16 | 355 | # Remove unneeded modules. |
paul@16 | 356 | |
paul@16 | 357 | all_modules = self.modules.items() |
paul@16 | 358 | |
paul@16 | 359 | for name, module in all_modules: |
paul@16 | 360 | if name not in self.required: |
paul@16 | 361 | module.unpropagate() |
paul@16 | 362 | del self.modules[name] |
paul@24 | 363 | self.removed[name] = module |
paul@16 | 364 | |
paul@68 | 365 | # Collect redundant objects. |
paul@68 | 366 | |
paul@68 | 367 | for module in self.removed.values(): |
paul@68 | 368 | module.collect() |
paul@68 | 369 | |
paul@68 | 370 | # Assert module objects where aliases have been removed. |
paul@68 | 371 | |
paul@68 | 372 | for name in self.required: |
paul@68 | 373 | if not self.objects.has_key(name): |
paul@68 | 374 | self.objects[name] = Reference("<module>", name) |
paul@68 | 375 | |
paul@0 | 376 | return m |
paul@0 | 377 | |
paul@0 | 378 | def finalise(self): |
paul@0 | 379 | |
paul@41 | 380 | """ |
paul@41 | 381 | Finalise the inspected program, returning whether the program could be |
paul@41 | 382 | finalised. |
paul@41 | 383 | """ |
paul@41 | 384 | |
paul@41 | 385 | if self.missing: |
paul@41 | 386 | return False |
paul@0 | 387 | |
paul@0 | 388 | self.finalise_classes() |
paul@0 | 389 | self.to_cache() |
paul@0 | 390 | self.set_class_types() |
paul@0 | 391 | self.define_instantiators() |
paul@0 | 392 | self.collect_constants() |
paul@0 | 393 | |
paul@41 | 394 | return True |
paul@41 | 395 | |
paul@12 | 396 | # Supporting operations. |
paul@12 | 397 | |
paul@12 | 398 | def resolve(self): |
paul@12 | 399 | |
paul@12 | 400 | "Resolve dependencies between modules." |
paul@12 | 401 | |
paul@35 | 402 | self.waiting = {} |
paul@35 | 403 | |
paul@35 | 404 | for module in self.modules.values(): |
paul@35 | 405 | |
paul@35 | 406 | # Resolve all deferred references in each module. |
paul@12 | 407 | |
paul@35 | 408 | for ref in module.deferred: |
paul@35 | 409 | found = self.find_dependency(ref) |
paul@35 | 410 | if not found: |
paul@41 | 411 | self.missing.add((module.name, ref.get_origin())) |
paul@35 | 412 | |
paul@35 | 413 | # Record the resolved names and identify required modules. |
paul@12 | 414 | |
paul@35 | 415 | else: |
paul@170 | 416 | # Find the providing module of this reference. |
paul@170 | 417 | # Where definitive details of the origin cannot be found, |
paul@170 | 418 | # identify the provider using the deferred reference. |
paul@170 | 419 | # NOTE: This may need to test for static origins. |
paul@170 | 420 | |
paul@170 | 421 | provider = self.get_module_provider(found.unresolved() and ref or found) |
paul@35 | 422 | ref.mutate(found) |
paul@35 | 423 | |
paul@35 | 424 | if provider: |
paul@16 | 425 | |
paul@35 | 426 | module.required.add(provider) |
paul@35 | 427 | self.accessing_modules[provider].add(module.name) |
paul@35 | 428 | |
paul@35 | 429 | # Postpone any inclusion of the provider until this |
paul@35 | 430 | # module becomes required. |
paul@12 | 431 | |
paul@35 | 432 | if module.name not in self.required: |
paul@35 | 433 | init_item(self.waiting, module.name, set) |
paul@35 | 434 | self.waiting[module.name].add(provider) |
paul@35 | 435 | |
paul@35 | 436 | # Make this module required in the accessing module. |
paul@32 | 437 | |
paul@53 | 438 | elif provider not in self.required: |
paul@35 | 439 | self.required.add(provider) |
paul@53 | 440 | if self.verbose: |
paul@53 | 441 | print >>sys.stderr, "Requiring", provider, "for", ref |
paul@35 | 442 | |
paul@38 | 443 | # Check modules again to see if they are now required and should now |
paul@38 | 444 | # cause the inclusion of other modules providing objects to the program. |
paul@38 | 445 | |
paul@35 | 446 | for module_name in self.waiting.keys(): |
paul@35 | 447 | self.require_providers(module_name) |
paul@16 | 448 | |
paul@35 | 449 | def require_providers(self, module_name): |
paul@38 | 450 | |
paul@38 | 451 | """ |
paul@38 | 452 | Test if 'module_name' is itself required and, if so, require modules |
paul@38 | 453 | containing objects provided to the module. |
paul@38 | 454 | """ |
paul@38 | 455 | |
paul@35 | 456 | if module_name in self.required and self.waiting.has_key(module_name): |
paul@35 | 457 | for provider in self.waiting[module_name]: |
paul@35 | 458 | if provider not in self.required: |
paul@35 | 459 | self.required.add(provider) |
paul@53 | 460 | if self.verbose: |
paul@53 | 461 | print >>sys.stderr, "Requiring", provider |
paul@35 | 462 | self.require_providers(provider) |
paul@32 | 463 | |
paul@12 | 464 | def find_dependency(self, ref): |
paul@12 | 465 | |
paul@12 | 466 | "Find the ultimate dependency for 'ref'." |
paul@12 | 467 | |
paul@12 | 468 | found = set() |
paul@12 | 469 | while ref and ref.has_kind("<depends>") and not ref in found: |
paul@12 | 470 | found.add(ref) |
paul@35 | 471 | ref = self.identify(ref.get_origin()) |
paul@12 | 472 | return ref |
paul@12 | 473 | |
paul@16 | 474 | def get_module_provider(self, ref): |
paul@16 | 475 | |
paul@16 | 476 | "Identify the provider of the given 'ref'." |
paul@16 | 477 | |
paul@16 | 478 | for ancestor in ref.ancestors(): |
paul@16 | 479 | if self.modules.has_key(ancestor): |
paul@16 | 480 | return ancestor |
paul@16 | 481 | return None |
paul@16 | 482 | |
paul@0 | 483 | def finalise_classes(self): |
paul@0 | 484 | |
paul@0 | 485 | "Finalise the class relationships and attributes." |
paul@0 | 486 | |
paul@0 | 487 | self.derive_inherited_attrs() |
paul@0 | 488 | self.derive_subclasses() |
paul@0 | 489 | self.derive_shadowed_attrs() |
paul@0 | 490 | |
paul@0 | 491 | def derive_inherited_attrs(self): |
paul@0 | 492 | |
paul@0 | 493 | "Derive inherited attributes for classes throughout the program." |
paul@0 | 494 | |
paul@0 | 495 | for name in self.classes.keys(): |
paul@0 | 496 | self.propagate_attrs_for_class(name) |
paul@0 | 497 | |
paul@0 | 498 | def propagate_attrs_for_class(self, name, visited=None): |
paul@0 | 499 | |
paul@0 | 500 | "Propagate inherited attributes for class 'name'." |
paul@0 | 501 | |
paul@0 | 502 | # Visit classes only once. |
paul@0 | 503 | |
paul@0 | 504 | if self.all_combined_attrs.has_key(name): |
paul@0 | 505 | return |
paul@0 | 506 | |
paul@0 | 507 | visited = visited or [] |
paul@0 | 508 | |
paul@0 | 509 | if name in visited: |
paul@0 | 510 | raise ProgramError, "Class %s may not inherit from itself: %s -> %s." % (name, " -> ".join(visited), name) |
paul@0 | 511 | |
paul@0 | 512 | visited.append(name) |
paul@0 | 513 | |
paul@0 | 514 | class_attrs = {} |
paul@0 | 515 | instance_attrs = {} |
paul@0 | 516 | |
paul@0 | 517 | # Aggregate the attributes from base classes, recording the origins of |
paul@0 | 518 | # applicable attributes. |
paul@0 | 519 | |
paul@0 | 520 | for base in self.classes[name][::-1]: |
paul@0 | 521 | |
paul@0 | 522 | # Get the identity of the class from the reference. |
paul@0 | 523 | |
paul@0 | 524 | base = base.get_origin() |
paul@0 | 525 | |
paul@0 | 526 | # Define the base class completely before continuing with this |
paul@0 | 527 | # class. |
paul@0 | 528 | |
paul@0 | 529 | self.propagate_attrs_for_class(base, visited) |
paul@0 | 530 | class_attrs.update(self.all_class_attrs[base]) |
paul@0 | 531 | |
paul@0 | 532 | # Instance attribute origins are combined if different. |
paul@0 | 533 | |
paul@0 | 534 | for key, values in self.all_instance_attrs[base].items(): |
paul@0 | 535 | init_item(instance_attrs, key, set) |
paul@0 | 536 | instance_attrs[key].update(values) |
paul@0 | 537 | |
paul@0 | 538 | # Class attributes override those defined earlier in the hierarchy. |
paul@0 | 539 | |
paul@0 | 540 | class_attrs.update(self.all_class_attrs.get(name, {})) |
paul@0 | 541 | |
paul@0 | 542 | # Instance attributes are merely added if not already defined. |
paul@0 | 543 | |
paul@0 | 544 | for key in self.all_instance_attrs.get(name, []): |
paul@0 | 545 | if not instance_attrs.has_key(key): |
paul@0 | 546 | instance_attrs[key] = set(["%s.%s" % (name, key)]) |
paul@0 | 547 | |
paul@0 | 548 | self.all_class_attrs[name] = class_attrs |
paul@0 | 549 | self.all_instance_attrs[name] = instance_attrs |
paul@0 | 550 | self.all_combined_attrs[name] = set(class_attrs.keys()).union(instance_attrs.keys()) |
paul@0 | 551 | |
paul@0 | 552 | def derive_subclasses(self): |
paul@0 | 553 | |
paul@0 | 554 | "Derive subclass details for classes." |
paul@0 | 555 | |
paul@0 | 556 | for name, bases in self.classes.items(): |
paul@0 | 557 | for base in bases: |
paul@0 | 558 | |
paul@0 | 559 | # Get the identity of the class from the reference. |
paul@0 | 560 | |
paul@0 | 561 | base = base.get_origin() |
paul@0 | 562 | self.subclasses[base].add(name) |
paul@0 | 563 | |
paul@0 | 564 | def derive_shadowed_attrs(self): |
paul@0 | 565 | |
paul@0 | 566 | "Derive shadowed attributes for classes." |
paul@0 | 567 | |
paul@0 | 568 | for name, attrs in self.all_instance_attrs.items(): |
paul@0 | 569 | attrs = set(attrs.keys()).intersection(self.all_class_attrs[name].keys()) |
paul@0 | 570 | if attrs: |
paul@0 | 571 | self.all_shadowed_attrs[name] = attrs |
paul@0 | 572 | |
paul@0 | 573 | def set_class_types(self): |
paul@0 | 574 | |
paul@0 | 575 | "Set the type of each class." |
paul@0 | 576 | |
paul@0 | 577 | for attrs in self.all_class_attrs.values(): |
paul@16 | 578 | attrs["__class__"] = self.type_ref.get_origin() |
paul@0 | 579 | |
paul@0 | 580 | def define_instantiators(self): |
paul@0 | 581 | |
paul@0 | 582 | """ |
paul@0 | 583 | Consolidate parameter and default details, incorporating initialiser |
paul@0 | 584 | details to define instantiator signatures. |
paul@0 | 585 | """ |
paul@0 | 586 | |
paul@0 | 587 | for cls, attrs in self.all_class_attrs.items(): |
paul@0 | 588 | initialiser = attrs["__init__"] |
paul@119 | 589 | self.function_parameters[cls] = self.function_parameters[initialiser] |
paul@0 | 590 | self.function_defaults[cls] = self.function_defaults[initialiser] |
paul@0 | 591 | |
paul@0 | 592 | def collect_constants(self): |
paul@0 | 593 | |
paul@0 | 594 | "Get constants from all active modules." |
paul@0 | 595 | |
paul@0 | 596 | for module in self.modules.values(): |
paul@0 | 597 | self.all_constants.update(module.constants) |
paul@0 | 598 | |
paul@0 | 599 | # Import methods. |
paul@0 | 600 | |
paul@0 | 601 | def find_in_path(self, name): |
paul@0 | 602 | |
paul@0 | 603 | """ |
paul@0 | 604 | Find the given module 'name' in the search path, returning None where no |
paul@0 | 605 | such module could be found, or a 2-tuple from the 'find' method |
paul@0 | 606 | otherwise. |
paul@0 | 607 | """ |
paul@0 | 608 | |
paul@0 | 609 | for d in self.path: |
paul@0 | 610 | m = self.find(d, name) |
paul@0 | 611 | if m: return m |
paul@0 | 612 | return None |
paul@0 | 613 | |
paul@0 | 614 | def find(self, d, name): |
paul@0 | 615 | |
paul@0 | 616 | """ |
paul@0 | 617 | In the directory 'd', find the given module 'name', where 'name' can |
paul@0 | 618 | either refer to a single file module or to a package. Return None if the |
paul@0 | 619 | 'name' cannot be associated with either a file or a package directory, |
paul@0 | 620 | or a 2-tuple from '_find_package' or '_find_module' otherwise. |
paul@0 | 621 | """ |
paul@0 | 622 | |
paul@0 | 623 | m = self._find_package(d, name) |
paul@0 | 624 | if m: return m |
paul@0 | 625 | m = self._find_module(d, name) |
paul@0 | 626 | if m: return m |
paul@0 | 627 | return None |
paul@0 | 628 | |
paul@0 | 629 | def _find_module(self, d, name): |
paul@0 | 630 | |
paul@0 | 631 | """ |
paul@0 | 632 | In the directory 'd', find the given module 'name', returning None where |
paul@0 | 633 | no suitable file exists in the directory, or a 2-tuple consisting of |
paul@0 | 634 | None (indicating that no package directory is involved) and a filename |
paul@0 | 635 | indicating the location of the module. |
paul@0 | 636 | """ |
paul@0 | 637 | |
paul@0 | 638 | name_py = name + extsep + "py" |
paul@0 | 639 | filename = self._find_file(d, name_py) |
paul@0 | 640 | if filename: |
paul@0 | 641 | return None, filename |
paul@0 | 642 | return None |
paul@0 | 643 | |
paul@0 | 644 | def _find_package(self, d, name): |
paul@0 | 645 | |
paul@0 | 646 | """ |
paul@0 | 647 | In the directory 'd', find the given package 'name', returning None |
paul@0 | 648 | where no suitable package directory exists, or a 2-tuple consisting of |
paul@0 | 649 | a directory (indicating the location of the package directory itself) |
paul@0 | 650 | and a filename indicating the location of the __init__.py module which |
paul@0 | 651 | declares the package's top-level contents. |
paul@0 | 652 | """ |
paul@0 | 653 | |
paul@0 | 654 | filename = self._find_file(d, name) |
paul@0 | 655 | if filename: |
paul@0 | 656 | init_py = "__init__" + extsep + "py" |
paul@0 | 657 | init_py_filename = self._find_file(filename, init_py) |
paul@0 | 658 | if init_py_filename: |
paul@0 | 659 | return filename, init_py_filename |
paul@0 | 660 | return None |
paul@0 | 661 | |
paul@0 | 662 | def _find_file(self, d, filename): |
paul@0 | 663 | |
paul@0 | 664 | """ |
paul@0 | 665 | Return the filename obtained when searching the directory 'd' for the |
paul@0 | 666 | given 'filename', or None if no actual file exists for the filename. |
paul@0 | 667 | """ |
paul@0 | 668 | |
paul@0 | 669 | filename = join(d, filename) |
paul@0 | 670 | if exists(filename): |
paul@0 | 671 | return filename |
paul@0 | 672 | else: |
paul@0 | 673 | return None |
paul@0 | 674 | |
paul@12 | 675 | def load(self, name): |
paul@0 | 676 | |
paul@0 | 677 | """ |
paul@0 | 678 | Load the module or package with the given 'name'. Return an object |
paul@0 | 679 | referencing the loaded module or package, or None if no such module or |
paul@0 | 680 | package exists. |
paul@0 | 681 | """ |
paul@0 | 682 | |
paul@0 | 683 | # Loaded modules are returned immediately. |
paul@0 | 684 | # Modules may be known but not yet loading (having been registered as |
paul@0 | 685 | # submodules), loading, loaded, or completely unknown. |
paul@0 | 686 | |
paul@12 | 687 | module = self.get_module(name) |
paul@0 | 688 | |
paul@0 | 689 | if module: |
paul@12 | 690 | return self.modules[name] |
paul@0 | 691 | |
paul@0 | 692 | # Otherwise, modules are loaded. |
paul@0 | 693 | |
paul@0 | 694 | # Split the name into path components, and try to find the uppermost in |
paul@0 | 695 | # the search path. |
paul@0 | 696 | |
paul@0 | 697 | path = name.split(".") |
paul@0 | 698 | path_so_far = [] |
paul@12 | 699 | module = None |
paul@0 | 700 | |
paul@0 | 701 | for p in path: |
paul@0 | 702 | |
paul@0 | 703 | # Get the module's filesystem details. |
paul@0 | 704 | |
paul@0 | 705 | if not path_so_far: |
paul@0 | 706 | m = self.find_in_path(p) |
paul@0 | 707 | elif d: |
paul@0 | 708 | m = self.find(d, p) |
paul@0 | 709 | else: |
paul@0 | 710 | m = None |
paul@0 | 711 | |
paul@0 | 712 | path_so_far.append(p) |
paul@0 | 713 | module_name = ".".join(path_so_far) |
paul@0 | 714 | |
paul@0 | 715 | if not m: |
paul@0 | 716 | if self.verbose: |
paul@0 | 717 | print >>sys.stderr, "Not found (%s)" % name |
paul@0 | 718 | |
paul@0 | 719 | return None # NOTE: Import error. |
paul@0 | 720 | |
paul@0 | 721 | # Get the module itself. |
paul@0 | 722 | |
paul@0 | 723 | d, filename = m |
paul@12 | 724 | module = self.load_from_file(filename, module_name) |
paul@0 | 725 | |
paul@12 | 726 | return module |
paul@0 | 727 | |
paul@12 | 728 | def load_from_file(self, filename, module_name=None): |
paul@0 | 729 | |
paul@0 | 730 | "Load the module from the given 'filename'." |
paul@0 | 731 | |
paul@0 | 732 | if module_name is None: |
paul@0 | 733 | module_name = "__main__" |
paul@0 | 734 | |
paul@0 | 735 | module = self.modules.get(module_name) |
paul@0 | 736 | |
paul@0 | 737 | if not module: |
paul@0 | 738 | |
paul@0 | 739 | # Try to load from cache. |
paul@0 | 740 | |
paul@12 | 741 | module = self.load_from_cache(filename, module_name) |
paul@0 | 742 | if module: |
paul@0 | 743 | return module |
paul@0 | 744 | |
paul@0 | 745 | # If no cache entry exists, load from file. |
paul@0 | 746 | |
paul@0 | 747 | module = inspector.InspectedModule(module_name, self) |
paul@0 | 748 | self.add_module(module_name, module) |
paul@0 | 749 | self.update_cache_validity(module) |
paul@0 | 750 | |
paul@12 | 751 | self._load(module, module_name, lambda m: m.parse, filename) |
paul@0 | 752 | |
paul@0 | 753 | return module |
paul@0 | 754 | |
paul@0 | 755 | def update_cache_validity(self, module): |
paul@0 | 756 | |
paul@0 | 757 | "Make 'module' valid in the cache, but invalidate accessing modules." |
paul@0 | 758 | |
paul@12 | 759 | accessing = self.accessing_modules.get(module.name) |
paul@12 | 760 | if accessing: |
paul@12 | 761 | self.invalidated.update(accessing) |
paul@0 | 762 | if module.name in self.invalidated: |
paul@0 | 763 | self.invalidated.remove(module.name) |
paul@0 | 764 | |
paul@0 | 765 | def source_is_new(self, filename, module_name): |
paul@0 | 766 | |
paul@0 | 767 | "Return whether 'filename' is newer than the cached 'module_name'." |
paul@0 | 768 | |
paul@0 | 769 | if self.cache: |
paul@0 | 770 | cache_filename = join(self.cache, module_name) |
paul@0 | 771 | return not exists(cache_filename) or \ |
paul@0 | 772 | getmtime(filename) > getmtime(cache_filename) or \ |
paul@0 | 773 | module_name in self.invalidated |
paul@0 | 774 | else: |
paul@0 | 775 | return True |
paul@0 | 776 | |
paul@12 | 777 | def load_from_cache(self, filename, module_name): |
paul@0 | 778 | |
paul@0 | 779 | "Return a module residing in the cache." |
paul@0 | 780 | |
paul@0 | 781 | module = self.modules.get(module_name) |
paul@0 | 782 | |
paul@12 | 783 | if not module and not self.source_is_new(filename, module_name): |
paul@13 | 784 | module = CachedModule(module_name, self) |
paul@12 | 785 | self.add_module(module_name, module) |
paul@0 | 786 | |
paul@12 | 787 | filename = join(self.cache, module_name) |
paul@12 | 788 | self._load(module, module_name, lambda m: m.from_cache, filename) |
paul@0 | 789 | |
paul@0 | 790 | return module |
paul@0 | 791 | |
paul@12 | 792 | def _load(self, module, module_name, fn, filename): |
paul@0 | 793 | |
paul@0 | 794 | """ |
paul@12 | 795 | Load 'module' for the given 'module_name', and with 'fn' performing an |
paul@12 | 796 | invocation on the module with the given 'filename'. |
paul@0 | 797 | """ |
paul@0 | 798 | |
paul@12 | 799 | # Load the module. |
paul@0 | 800 | |
paul@0 | 801 | if self.verbose: |
paul@53 | 802 | print >>sys.stderr, module_name in self.required and "Required" or "Loading", module_name, "from", filename |
paul@0 | 803 | fn(module)(filename) |
paul@0 | 804 | |
paul@54 | 805 | # Add the module object if not already defined. |
paul@54 | 806 | |
paul@54 | 807 | if not self.objects.has_key(module_name): |
paul@54 | 808 | self.objects[module_name] = Reference("<module>", module_name) |
paul@54 | 809 | |
paul@0 | 810 | def add_module(self, module_name, module): |
paul@0 | 811 | |
paul@0 | 812 | """ |
paul@0 | 813 | Return the module with the given 'module_name', adding a new module |
paul@0 | 814 | object if one does not already exist. |
paul@0 | 815 | """ |
paul@0 | 816 | |
paul@0 | 817 | self.modules[module_name] = module |
paul@12 | 818 | if module_name in self.to_import: |
paul@12 | 819 | self.to_import.remove(module_name) |
paul@0 | 820 | |
paul@0 | 821 | # vim: tabstop=4 expandtab shiftwidth=4 |