paul@0 | 1 | #!/usr/bin/env python |
paul@0 | 2 | |
paul@0 | 3 | """ |
paul@0 | 4 | Import logic. |
paul@0 | 5 | |
paul@0 | 6 | Copyright (C) 2006, 2007, 2008, 2009, 2010, 2011, 2012, 2013, |
paul@0 | 7 | 2014, 2015, 2016 Paul Boddie <paul@boddie.org.uk> |
paul@0 | 8 | |
paul@0 | 9 | This program is free software; you can redistribute it and/or modify it under |
paul@0 | 10 | the terms of the GNU General Public License as published by the Free Software |
paul@0 | 11 | Foundation; either version 3 of the License, or (at your option) any later |
paul@0 | 12 | version. |
paul@0 | 13 | |
paul@0 | 14 | This program is distributed in the hope that it will be useful, but WITHOUT |
paul@0 | 15 | ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS |
paul@0 | 16 | FOR A PARTICULAR PURPOSE. See the GNU General Public License for more |
paul@0 | 17 | details. |
paul@0 | 18 | |
paul@0 | 19 | You should have received a copy of the GNU General Public License along with |
paul@0 | 20 | this program. If not, see <http://www.gnu.org/licenses/>. |
paul@0 | 21 | """ |
paul@0 | 22 | |
paul@0 | 23 | from errors import ProgramError |
paul@0 | 24 | from os.path import exists, extsep, getmtime, join |
paul@0 | 25 | from os import listdir, makedirs, remove |
paul@0 | 26 | from common import init_item, readfile, writefile |
paul@13 | 27 | from modules import CachedModule |
paul@0 | 28 | from referencing import Reference |
paul@0 | 29 | import inspector |
paul@0 | 30 | import sys |
paul@0 | 31 | |
class Importer:

    "An import machine, searching for and loading modules."

    def __init__(self, path, cache=None, verbose=False):

        """
        Initialise the importer with the given search 'path' - a list of
        directories to search for Python modules.

        The optional 'cache' should be the name of a directory used to store
        cached module information. Where no cache is given, the cache
        maintenance methods do nothing and modules are always loaded from
        their source files.

        The optional 'verbose' parameter causes output concerning the activities
        of the object to be produced if set to a true value (not the default).
        """

        self.path = path
        self.cache = cache
        self.verbose = verbose

        # Names of modules awaiting import, names of modules needed in the
        # final program, and modules discarded by 'initialise'.

        self.to_import = set()
        self.required = set(["__main__"])
        self.removed = {}

        # Loaded modules by name, the names of modules accessing each queued
        # module, and the names of modules whose cache entries must not be
        # used.

        self.modules = {}
        self.accessing_modules = {}
        self.invalidated = set()

        # Object references by name, plus class and function details.

        self.objects = {}
        self.classes = {}
        self.function_parameters = {}
        self.function_defaults = {}
        self.function_targets = {}
        self.function_arguments = {}

        # Derived information.

        self.subclasses = {}

        # Attributes of different object types.

        self.all_class_attrs = {}
        self.all_instance_attrs = {}
        self.all_instance_attr_constants = {}
        self.all_combined_attrs = {}
        self.all_module_attrs = {}
        self.all_shadowed_attrs = {}

        # References to external names and aliases within program units.

        self.all_name_references = {}
        self.all_initialised_names = {}
        self.all_aliased_names = {}

        # General attribute accesses.

        self.all_attr_accesses = {}
        self.all_const_accesses = {}
        self.all_attr_access_modifiers = {}

        # Constant literals and values.

        self.all_constants = {}
        self.all_constant_values = {}

        # The reference for the type of all classes, set by 'initialise'.

        self.type_ref = None

        self.make_cache()

    def make_cache(self):

        "Create the cache directory if one is configured but does not exist."

        if self.cache and not exists(self.cache):
            makedirs(self.cache)

    def check_cache(self, details):

        """
        Check whether the cache applies for the given 'details', invalidating it
        if it does not, and record 'details' as the current cache details.

        Nothing is done if no cache directory is configured.
        """

        # Without a cache directory there is nothing to compare or record.

        if not self.cache:
            return

        if self.get_cache_details() != details:
            self.remove_cache()

        writefile(self.get_cache_details_filename(), details)

    def get_cache_details_filename(self):

        """
        Return the filename for the cache details. This requires a cache
        directory to have been configured.
        """

        return join(self.cache, "$details")

    def get_cache_details(self):

        """
        Return details of the cache, or None if no cache is configured or no
        details have been recorded.
        """

        if not self.cache:
            return None

        details_filename = self.get_cache_details_filename()

        if exists(details_filename):
            return readfile(details_filename)

        return None

    def remove_cache(self):

        """
        Remove the contents of the cache. Nothing is done if no cache is
        configured or if the cache directory does not exist.
        """

        if not self.cache or not exists(self.cache):
            return

        # NOTE: Each entry is removed as a file; subdirectories are presumably
        # NOTE: never created within the cache.

        for filename in listdir(self.cache):
            remove(join(self.cache, filename))

    def to_cache(self):

        "Write modules to the cache, if a cache is configured."

        if self.cache:
            for module_name, module in self.modules.items():
                module.to_cache(join(self.cache, module_name))

    # Object retrieval and storage.

    def get_object(self, name):

        """
        Return a reference for the given 'name' or None if no such object
        exists.
        """

        return self.objects.get(name)

    def set_object(self, name, value=None):

        """
        Set the object with the given 'name' and the given 'value'. A reference
        given as 'value' is recorded as an alias under 'name'; any other value
        is used to construct a new reference for 'name'.
        """

        if isinstance(value, Reference):
            ref = value.alias(name)
        else:
            ref = Reference(value, name)

        self.objects[name] = ref

    # Identification of both stored object names and name references.

    def identify(self, name):

        """
        Identify 'name' using stored object and external name records,
        consulting the external name records only where the stored object is
        absent or tests as false.
        """

        return self.objects.get(name) or self.all_name_references.get(name)

    # Indirect object retrieval.

    def get_attributes(self, ref, attrname):

        """
        Return the set of attributes provided by 'ref' for 'attrname'. Class
        attributes may be provided by instances. An empty set is returned for
        other kinds of reference or where no attribute is found.
        """

        kind = ref.get_kind()

        if kind == "<instance>":
            return self.get_combined_attributes(ref.get_origin(), attrname)

        if kind == "<class>":
            attr = self.get_class_attribute(ref.get_origin(), attrname)
        elif kind == "<module>":
            attr = self.get_module_attribute(ref.get_origin(), attrname)
        else:
            return set()

        # The truth value of the reference decides whether it is provided.

        if attr:
            return set([attr])

        return set()

    def get_class_attribute(self, object_type, attrname):

        "Return from 'object_type' the details of class attribute 'attrname'."

        attr = self.all_class_attrs[object_type].get(attrname)
        return attr and self.get_object(attr)

    def get_instance_attributes(self, object_type, attrname):

        """
        Return from 'object_type' the details of instance attribute 'attrname'
        as a set of references. A constant recorded for the attribute is used
        in preference to a "<var>" reference for each attribute origin.
        """

        consts = self.all_instance_attr_constants.get(object_type)
        const = consts and consts.get(attrname)

        attrs = set()
        for attr in self.all_instance_attrs[object_type].get(attrname, []):
            attrs.add(const or Reference("<var>", attr))
        return attrs

    def get_combined_attributes(self, object_type, attrname):

        """
        Return from 'object_type' the details of class or instance attribute
        'attrname' as a set of references.
        """

        refs = set()

        ref = self.get_class_attribute(object_type, attrname)
        if ref:
            refs.add(ref)

        refs.update(self.get_instance_attributes(object_type, attrname))
        return refs

    def get_module_attribute(self, object_type, attrname):

        """
        Return from 'object_type' the details of module attribute 'attrname',
        or None if the module has no such attribute.
        """

        if attrname in self.all_module_attrs[object_type]:
            return self.get_object("%s.%s" % (object_type, attrname))

        return None

    # Module management.

    def queue_module(self, name, accessor, required=False):

        """
        Queue the module with the given 'name' for import from the given
        'accessor' module. If 'required' is true (it is false by default), the
        module will be required in the final program.
        """

        if name not in self.modules:
            self.to_import.add(name)

        if required:
            self.required.add(name)

        # Remember which modules access the queued module.

        init_item(self.accessing_modules, name, set)
        self.accessing_modules[name].add(accessor.name)

    def get_modules(self):

        "Return all modules known to the importer."

        return self.modules.values()

    def get_module(self, name):

        "Return the module with the given 'name', or None if it is not known."

        return self.modules.get(name)

    # Program operations.

    def initialise(self, filename, reset=False):

        """
        Initialise a program whose main module is 'filename', resetting the
        cache if 'reset' is true. Return the main module.

        A ProgramError is raised if a queued module cannot be found.
        """

        if reset:
            self.remove_cache()
        self.check_cache(filename)

        # Load the program itself.

        m = self.load_from_file(filename)

        # Load any queued modules.

        while self.to_import:
            for name in list(self.to_import): # avoid mutation issue
                if self.load(name) is None:

                    # Only successfully added modules are removed from the
                    # queue, so a missing module would otherwise be retried
                    # forever.

                    self.to_import.discard(name)
                    raise ProgramError("Module not found: %s" % name)

        # Resolve dependencies between modules.

        self.resolve()

        # Record the type of all classes.

        self.type_ref = self.get_object("__builtins__.type")

        # Resolve dependencies within the program.

        for module in self.modules.values():
            module.complete()

        # Remove unneeded modules, iterating over a snapshot because the
        # module dictionary is modified in the loop.

        for name, module in list(self.modules.items()):
            if name not in self.required:
                module.unpropagate()
                del self.modules[name]
                self.removed[name] = module

        return m

    def finalise(self):

        "Finalise the inspected program."

        self.finalise_classes()
        self.to_cache()
        self.set_class_types()
        self.define_instantiators()
        self.collect_constants()

    # Supporting operations.

    def resolve(self):

        """
        Resolve dependencies between modules, replacing "<depends>" references
        in the object and name reference records with the references they
        ultimately depend upon, and marking the modules providing those
        references as required.
        """

        for d in [self.objects, self.all_name_references]:
            resolved = {}

            for name, ref in d.items():
                if ref.has_kind("<depends>"):
                    found = self.find_dependency(ref)
                    if found:
                        resolved[name] = found
                    else:
                        sys.stderr.write("Name %s references an unknown object: %s\n" % (name, ref.get_origin()))

            # Record the resolved names and identify required modules.

            for name, ref in resolved.items():
                d[name] = ref

                # Find the providing module of this reference.

                module_name = self.get_module_provider(ref)
                if module_name:
                    self.required.add(module_name)

                    # Make this module required in all accessing modules.
                    # Providers never queued using 'queue_module' have no
                    # accessing modules recorded.

                    for accessor_name in self.accessing_modules.get(module_name, ()):
                        self.modules[accessor_name].required.add(module_name)

    def find_dependency(self, ref):

        """
        Find the ultimate dependency for 'ref', following "<depends>"
        references through the object records until a reference of another
        kind, a missing object or an already-visited reference is reached.
        """

        found = set()
        while ref and ref.has_kind("<depends>") and ref not in found:
            found.add(ref)
            ref = self.objects.get(ref.get_origin())
        return ref

    def get_module_provider(self, ref):

        """
        Identify the provider of the given 'ref', this being the first of its
        ancestors that names a known module, or None if there is none.
        """

        for ancestor in ref.ancestors():
            if ancestor in self.modules:
                return ancestor
        return None

    def finalise_classes(self):

        "Finalise the class relationships and attributes."

        self.derive_inherited_attrs()
        self.derive_subclasses()
        self.derive_shadowed_attrs()

    def derive_inherited_attrs(self):

        "Derive inherited attributes for classes throughout the program."

        for name in self.classes.keys():
            self.propagate_attrs_for_class(name)

    def propagate_attrs_for_class(self, name, visited=None):

        """
        Propagate inherited attributes for class 'name', using 'visited' to
        record the classes encountered during the current traversal.

        A ProgramError is raised if the class is found to inherit from itself.
        """

        # Visit classes only once.

        if name in self.all_combined_attrs:
            return

        visited = visited or []

        if name in visited:
            raise ProgramError("Class %s may not inherit from itself: %s -> %s." % (name, " -> ".join(visited), name))

        visited.append(name)

        class_attrs = {}
        instance_attrs = {}

        # Aggregate the attributes from base classes, recording the origins of
        # applicable attributes. Bases are processed in reverse order so that
        # attributes from earlier bases replace those from later ones.

        for base in self.classes[name][::-1]:

            # Get the identity of the class from the reference.

            base = base.get_origin()

            # Define the base class completely before continuing with this
            # class.

            self.propagate_attrs_for_class(base, visited)
            class_attrs.update(self.all_class_attrs[base])

            # Instance attribute origins are combined if different.

            for key, values in self.all_instance_attrs[base].items():
                init_item(instance_attrs, key, set)
                instance_attrs[key].update(values)

        # Class attributes override those defined earlier in the hierarchy.

        class_attrs.update(self.all_class_attrs.get(name, {}))

        # Instance attributes are merely added if not already defined.

        for key in self.all_instance_attrs.get(name, []):
            if key not in instance_attrs:
                instance_attrs[key] = set(["%s.%s" % (name, key)])

        self.all_class_attrs[name] = class_attrs
        self.all_instance_attrs[name] = instance_attrs
        self.all_combined_attrs[name] = set(class_attrs.keys()).union(instance_attrs.keys())

    def derive_subclasses(self):

        """
        Derive subclass details for classes, adding each class to the subclass
        record of each of its bases.
        """

        # NOTE: An entry for each base is expected to exist already,
        # NOTE: presumably having been created when the class was inspected.

        for name, bases in self.classes.items():
            for base in bases:

                # Get the identity of the class from the reference.

                base = base.get_origin()
                self.subclasses[base].add(name)

    def derive_shadowed_attrs(self):

        """
        Derive shadowed attributes for classes, these being the names defined
        both as instance attributes and as class attributes.
        """

        for name, attrs in self.all_instance_attrs.items():
            shadowed = set(attrs.keys()).intersection(self.all_class_attrs[name].keys())
            if shadowed:
                self.all_shadowed_attrs[name] = shadowed

    def set_class_types(self):

        """
        Set the type of each class using the type reference recorded by
        'initialise'.
        """

        for attrs in self.all_class_attrs.values():
            attrs["__class__"] = self.type_ref.get_origin()

    def define_instantiators(self):

        """
        Consolidate parameter and default details, incorporating initialiser
        details to define instantiator signatures. Each class acquires the
        parameters of its initialiser, without the first parameter, together
        with the initialiser's defaults.
        """

        for cls, attrs in self.all_class_attrs.items():
            initialiser = attrs["__init__"]
            self.function_parameters[cls] = self.function_parameters[initialiser][1:]
            self.function_defaults[cls] = self.function_defaults[initialiser]

    def collect_constants(self):

        "Get constants from all active modules."

        for module in self.modules.values():
            self.all_constants.update(module.constants)

    # Import methods.

    def find_in_path(self, name):

        """
        Find the given module 'name' in the search path, returning None where no
        such module could be found, or a 2-tuple from the 'find' method
        otherwise.
        """

        for d in self.path:
            m = self.find(d, name)
            if m:
                return m
        return None

    def find(self, d, name):

        """
        In the directory 'd', find the given module 'name', where 'name' can
        either refer to a single file module or to a package. Return None if the
        'name' cannot be associated with either a file or a package directory,
        or a 2-tuple from '_find_package' or '_find_module' otherwise.
        """

        # Packages take precedence over single file modules.

        return self._find_package(d, name) or self._find_module(d, name) or None

    def _find_module(self, d, name):

        """
        In the directory 'd', find the given module 'name', returning None where
        no suitable file exists in the directory, or a 2-tuple consisting of
        None (indicating that no package directory is involved) and a filename
        indicating the location of the module.
        """

        filename = self._find_file(d, name + extsep + "py")
        if filename:
            return None, filename
        return None

    def _find_package(self, d, name):

        """
        In the directory 'd', find the given package 'name', returning None
        where no suitable package directory exists, or a 2-tuple consisting of
        a directory (indicating the location of the package directory itself)
        and a filename indicating the location of the __init__.py module which
        declares the package's top-level contents.
        """

        dirname = self._find_file(d, name)
        if dirname:
            init_py_filename = self._find_file(dirname, "__init__" + extsep + "py")
            if init_py_filename:
                return dirname, init_py_filename
        return None

    def _find_file(self, d, filename):

        """
        Return the filename obtained when searching the directory 'd' for the
        given 'filename', or None if no actual file exists for the filename.
        """

        filename = join(d, filename)
        if exists(filename):
            return filename
        return None

    def load(self, name):

        """
        Load the module or package with the given 'name'. Return an object
        referencing the loaded module or package, or None if no such module or
        package exists.
        """

        # Loaded modules are returned immediately.
        # Modules may be known but not yet loading (having been registered as
        # submodules), loading, loaded, or completely unknown.

        module = self.get_module(name)

        if module:
            return module

        # Otherwise, modules are loaded.

        if self.verbose:
            sys.stderr.write("Loading %s\n" % (name,))

        # Split the name into path components, and try to find the uppermost in
        # the search path.

        path_so_far = []
        module = None

        # The directory of the package found for the preceding component.

        d = None

        for p in name.split("."):

            # Get the module's filesystem details. Only the first component is
            # sought in the search path; later components must reside in the
            # package directory of the preceding component.

            if not path_so_far:
                m = self.find_in_path(p)
            elif d:
                m = self.find(d, p)
            else:
                m = None

            path_so_far.append(p)
            module_name = ".".join(path_so_far)

            if not m:
                if self.verbose:
                    sys.stderr.write("Not found (%s)\n" % (name,))

                return None # NOTE: Import error.

            # Get the module itself.

            d, filename = m
            module = self.load_from_file(filename, module_name)

        return module

    def load_from_file(self, filename, module_name=None):

        """
        Load the module from the given 'filename', registering it using the
        given 'module_name' or as "__main__" if no name is given. An already
        loaded module is returned as it is, and a usable cache entry is
        employed in preference to the source file.
        """

        if module_name is None:
            module_name = "__main__"

        module = self.modules.get(module_name)

        if not module:

            # Try to load from cache.

            module = self.load_from_cache(filename, module_name)
            if module:
                return module

            # If no cache entry exists, load from file.

            module = inspector.InspectedModule(module_name, self)
            self.add_module(module_name, module)
            self.update_cache_validity(module)

            self._load(module, module_name, lambda m: m.parse, filename)

        return module

    def update_cache_validity(self, module):

        "Make 'module' valid in the cache, but invalidate accessing modules."

        accessing = self.accessing_modules.get(module.name)
        if accessing:
            self.invalidated.update(accessing)

        self.invalidated.discard(module.name)

    def source_is_new(self, filename, module_name):

        """
        Return whether 'filename' is newer than the cached 'module_name'. The
        source is also regarded as new if there is no cache or cache entry, or
        if the module has been invalidated.
        """

        if not self.cache:
            return True

        cache_filename = join(self.cache, module_name)
        return not exists(cache_filename) or \
            getmtime(filename) > getmtime(cache_filename) or \
            module_name in self.invalidated

    def load_from_cache(self, filename, module_name):

        """
        Return a module residing in the cache, this being an already loaded
        module if one exists for 'module_name', a module loaded from the cache
        if the source 'filename' is not newer than the cache entry, or a false
        value otherwise.
        """

        module = self.modules.get(module_name)

        if not module and not self.source_is_new(filename, module_name):
            module = CachedModule(module_name, self)
            self.add_module(module_name, module)

            cache_filename = join(self.cache, module_name)
            self._load(module, module_name, lambda m: m.from_cache, cache_filename)

        return module

    def _load(self, module, module_name, fn, filename):

        """
        Load 'module' for the given 'module_name', and with 'fn' performing an
        invocation on the module with the given 'filename'.
        """

        # Load the module. The given function selects the method of the module
        # to be called with the filename.

        if self.verbose:
            sys.stderr.write("Loading %s\n" % (filename,))
        fn(module)(filename)
        if self.verbose:
            sys.stderr.write("Loaded %s\n" % (filename,))

    def add_module(self, module_name, module):

        """
        Register 'module' under the given 'module_name', recording a module
        reference for it and removing the name from the modules awaiting
        import. Any existing module registered under the name is replaced.
        """

        self.modules[module_name] = module
        self.objects[module_name] = Reference("<module>", module_name)
        self.to_import.discard(module_name)
paul@0 | 724 | # vim: tabstop=4 expandtab shiftwidth=4 |