import py import os import inspect from py.__.apigen.layout import LayoutPage from py.__.apigen.source import browser as source_browser from py.__.apigen.source import html as source_html from py.__.apigen.source import color as source_color from py.__.apigen.tracer.description import is_private from py.__.apigen.rest.genrest import split_of_last_part from py.__.apigen.linker import relpath from py.__.apigen.html import H sorted = py.builtin.sorted html = py.xml.html raw = py.xml.raw def is_navigateable(name): return (not is_private(name) and name != '__doc__') def show_property(name): if not name.startswith('_'): return True if name.startswith('__') and name.endswith('__'): # XXX do we need to skip more manually here? if (name not in dir(object) and name not in ['__doc__', '__dict__', '__name__', '__module__', '__weakref__']): return True return False def deindent(str, linesep='\n'): """ de-indent string can be used to de-indent Python docstrings, it de-indents the first line to the side always, and determines the indentation of the rest of the text by taking that of the least indented (filled) line """ lines = str.strip().split(linesep) normalized = [] deindent = None normalized.append(lines[0].strip()) # replace tabs with spaces, empty lines that contain spaces only, and # find out what the smallest indentation is for line in lines[1:]: line = line.replace('\t', ' ' * 4) stripped = line.strip() if not stripped: normalized.append('') else: rstripped = line.rstrip() indent = len(rstripped) - len(stripped) if deindent is None or indent < deindent: deindent = indent normalized.append(line) ret = [normalized[0]] for line in normalized[1:]: if not line: ret.append(line) else: ret.append(line[deindent:]) return '%s\n' % (linesep.join(ret),) def get_linesep(s, default='\n'): """ return the line seperator of a string returns 'default' if no seperator can be found """ for sep in ('\r\n', '\r', '\n'): if sep in s: return sep return default def get_param_htmldesc(linker, func): """ get the html for the parameters of a function """ import inspect # XXX copy and modify formatargspec to produce html return inspect.formatargspec(*inspect.getargspec(func)) # some helper functionality def source_dirs_files(fspath): """ returns a tuple (dirs, files) for fspath dirs are all the subdirs, files are the files which are interesting in building source documentation for a Python code tree (basically all normal files excluding .pyc and .pyo ones) all files and dirs that have a name starting with . are considered hidden """ dirs = [] files = [] for child in fspath.listdir(): if child.basename.startswith('.'): continue if child.check(dir=True): dirs.append(child) elif child.check(file=True): if child.ext in ['.pyc', '.pyo']: continue files.append(child) return sorted(dirs), sorted(files) def create_namespace_tree(dotted_names): """ creates a tree (in dict form) from a set of dotted names """ ret = {} for dn in dotted_names: path = dn.split('.') for i in xrange(len(path)): ns = '.'.join(path[:i]) itempath = '.'.join(path[:i + 1]) if ns not in ret: ret[ns] = [] if itempath not in ret[ns]: ret[ns].append(itempath) return ret def wrap_page(project, title, contentel, navel, relbase, basepath): page = LayoutPage(project, title, nav=navel, encoding='UTF-8', relpath=relbase) page.set_content(contentel) page.setup_scripts_styles(basepath) return page # the PageBuilder classes take care of producing the docs (using the stuff # above) class AbstractPageBuilder(object): def write_page(self, title, reltargetpath, project, tag, nav): targetpath = self.base.join(reltargetpath) relbase= relpath('%s%s' % (targetpath.dirpath(), targetpath.sep), self.base.strpath + '/') page = wrap_page(project, title, tag, nav, relbase, self.base) content = self.linker.call_withbase(reltargetpath, page.unicode) targetpath.ensure() targetpath.write(content.encode("utf8")) class SourcePageBuilder(AbstractPageBuilder): """ builds the html for a source docs page """ def __init__(self, base, linker, projroot, capture=None): self.base = base self.linker = linker self.projroot = projroot self.capture = capture def build_navigation(self, fspath): nav = H.Navigation(class_='sidebar') relpath = fspath.relto(self.projroot) path = relpath.split(os.path.sep) indent = 0 # build links to parents if relpath != '': for i in xrange(len(path)): dirpath = os.path.sep.join(path[:i]) abspath = self.projroot.join(dirpath).strpath if i == 0: text = self.projroot.basename else: text = path[i-1] nav.append(H.NavigationItem(self.linker, abspath, text, indent, False)) indent += 1 # build siblings or children and self if fspath.check(dir=True): # we're a dir, build ourselves and our children dirpath = fspath nav.append(H.NavigationItem(self.linker, dirpath.strpath, dirpath.basename, indent, True)) indent += 1 elif fspath.strpath == self.projroot.strpath: dirpath = fspath else: # we're a file, build our parent's children only dirpath = fspath.dirpath() diritems, fileitems = source_dirs_files(dirpath) for dir in diritems: nav.append(H.NavigationItem(self.linker, dir.strpath, dir.basename, indent, False)) for file in fileitems: selected = (fspath.check(file=True) and file.basename == fspath.basename) nav.append(H.NavigationItem(self.linker, file.strpath, file.basename, indent, selected)) return nav re = py.std.re _reg_body = re.compile(r'
]*>(.*)', re.S) def build_python_page(self, fspath): # XXX two reads of the same file here... not very bad (disk caches # and such) but also not very nice... enc = source_html.get_module_encoding(fspath.strpath) source = fspath.read() sep = get_linesep(source) colored = enumerate_and_color(source.split(sep), 0, enc) tag = H.SourceDef(*colored) nav = self.build_navigation(fspath) return tag, nav def build_dir_page(self, fspath): dirs, files = source_dirs_files(fspath) dirs = [(p.basename, self.linker.get_lazyhref(str(p))) for p in dirs] files = [(p.basename, self.linker.get_lazyhref(str(p))) for p in files] tag = H.DirList(dirs, files) nav = self.build_navigation(fspath) return tag, nav def build_nonpython_page(self, fspath): try: tag = H.NonPythonSource(unicode(fspath.read(), 'utf-8')) except UnicodeError: # XXX we should fix non-ascii support here!! tag = H.NonPythonSource('no source available (binary file?)') nav = self.build_navigation(fspath) return tag, nav def prepare_pages(self, base): passed = [] for fspath in [base] + list(base.visit()): if fspath.ext in ['.pyc', '.pyo']: continue relfspath = fspath.relto(base) if relfspath.find('%s.' % (os.path.sep,)) > -1: # skip hidden dirs and files continue elif fspath.check(dir=True): if relfspath != '': relfspath += os.path.sep reloutputpath = 'source%s%sindex.html' % (os.path.sep, relfspath) else: reloutputpath = "source%s%s.html" % (os.path.sep, relfspath) reloutputpath = reloutputpath.replace(os.path.sep, '/') outputpath = self.base.join(reloutputpath) self.linker.set_link(str(fspath), reloutputpath) passed.append((fspath, outputpath)) return passed def build_pages(self, data, project, base): """ build syntax-colored source views """ for fspath, outputpath in data: if fspath.check(ext='.py'): try: tag, nav = self.build_python_page(fspath) except (KeyboardInterrupt, SystemError): raise except: # XXX strange stuff going wrong at times... need to fix raise exc, e, tb = py.std.sys.exc_info() print '%s - %s' % (exc, e) print print ''.join(py.std.traceback.format_tb(tb)) print '-' * 79 del tb tag, nav = self.build_nonpython_page(fspath) elif fspath.check(dir=True): tag, nav = self.build_dir_page(fspath) else: tag, nav = self.build_nonpython_page(fspath) title = 'sources for %s' % (fspath.basename,) reltargetpath = outputpath.relto(self.base).replace(os.path.sep, '/') self.write_page(title, reltargetpath, project, tag, nav) def enumerate_and_color(codelines, firstlineno, enc): tokenizer = source_color.Tokenizer(source_color.PythonSchema) colored = [] for i, line in enumerate(codelines): try: colored.append(H.span('%04s: ' % (i + firstlineno + 1))) colored.append(source_html.prepare_line([line], tokenizer, enc)) colored.append('\n') except py.error.ENOENT: # error reading source code, giving up colored = org break return colored def get_obj(pkg, dotted_name): full_dotted_name = '%s.%s' % (pkg.__name__, dotted_name) if dotted_name == '': return pkg path = dotted_name.split('.') ret = pkg for item in path: marker = [] ret = getattr(ret, item, marker) if ret is marker: raise NameError('can not access %s in %s' % (item, full_dotted_name)) return ret class ApiPageBuilder(AbstractPageBuilder): """ builds the html for an api docs page """ def __init__(self, base, linker, dsa, projroot, namespace_tree, capture=None): self.base = base self.linker = linker self.dsa = dsa self.projroot = projroot self.projpath = py.path.local(projroot) self.namespace_tree = namespace_tree self.capture = capture pkgname = self.dsa.get_module_name().split('/')[-1] self.pkg = __import__(pkgname) def build_callable_view(self, dotted_name): """ build the html for a class method """ # XXX we may want to have seperate func = get_obj(self.pkg, dotted_name) docstring = func.__doc__ if docstring: docstring = deindent(docstring) localname = func.__name__ argdesc = get_param_htmldesc(self.linker, func) valuedesc = self.build_callable_signature_description(dotted_name) sourcefile = inspect.getsourcefile(func) callable_source = self.dsa.get_function_source(dotted_name) # i assume they're both either available or unavailable(XXX ?) is_in_pkg = self.is_in_pkg(sourcefile) href = None text = 'could not get to source file' colored = [] if sourcefile and callable_source: enc = source_html.get_module_encoding(sourcefile) tokenizer = source_color.Tokenizer(source_color.PythonSchema) firstlineno = func.func_code.co_firstlineno sep = get_linesep(callable_source) org = callable_source.split(sep) colored = enumerate_and_color(org, firstlineno, enc) text = 'source: %s' % (sourcefile,) if is_in_pkg: href = self.linker.get_lazyhref(sourcefile) csource = H.SourceSnippet(text, href, colored) callstack = self.dsa.get_function_callpoints(dotted_name) csitems = [] for cs, _ in callstack: csitems.append(self.build_callsite(dotted_name, cs)) snippet = H.FunctionDescription(localname, argdesc, docstring, valuedesc, csource, csitems) return snippet def build_class_view(self, dotted_name): """ build the html for a class """ cls = get_obj(self.pkg, dotted_name) # XXX is this a safe check? try: sourcefile = inspect.getsourcefile(cls) except TypeError: sourcelink = 'builtin file, no source available' else: if sourcefile is None: sourcelink = H.div('no source available') else: if sourcefile[-1] in ['o', 'c']: sourcefile = sourcefile[:-1] sourcelink = H.div(H.a('view source', href=self.linker.get_lazyhref(sourcefile))) docstring = cls.__doc__ if docstring: docstring = deindent(docstring) if not hasattr(cls, '__name__'): clsname = 'instance of %s' % (cls.__class__.__name__,) else: clsname = cls.__name__ bases = self.build_bases(dotted_name) properties = self.build_properties(cls) methods = self.build_methods(dotted_name) snippet = H.ClassDescription( # XXX bases HTML H.ClassDef('%s(' % (clsname,), *bases), H.Docstring(docstring or '*no docstring available*'), sourcelink, *(properties+methods) ) return snippet def build_bases(self, dotted_name): basehtml = [] bases = self.dsa.get_possible_base_classes(dotted_name) for base in bases: try: obj = self.dsa.get_obj(base.name) except KeyError: basehtml.append(base.name) else: href = self.linker.get_lazyhref(base.name) basehtml.append(H.BaseDescription(base.name, href=href)) basehtml.append(',') if basehtml: basehtml.pop() basehtml.append('):') return basehtml def build_properties(self, cls): properties = [] for attr in dir(cls): val = getattr(cls, attr) if show_property(attr) and not callable(val): if isinstance(val, property): val = '