Spaces:
Build error
Build error
""" | |
A Cython plugin for coverage.py | |
Requires the coverage package at least in version 4.0 (which added the plugin API). | |
""" | |
from __future__ import absolute_import | |
import re | |
import os.path | |
import sys | |
from collections import defaultdict | |
from coverage.plugin import CoveragePlugin, FileTracer, FileReporter # requires coverage.py 4.0+ | |
from coverage.files import canonical_filename | |
from .Utils import find_root_package_dir, is_package_dir, open_source_file | |
from . import __version__ | |
C_FILE_EXTENSIONS = ['.c', '.cpp', '.cc', '.cxx'] | |
MODULE_FILE_EXTENSIONS = set(['.py', '.pyx', '.pxd'] + C_FILE_EXTENSIONS) | |
def _find_c_source(base_path): | |
file_exists = os.path.exists | |
for ext in C_FILE_EXTENSIONS: | |
file_name = base_path + ext | |
if file_exists(file_name): | |
return file_name | |
return None | |
def _find_dep_file_path(main_file, file_path, relative_path_search=False): | |
abs_path = os.path.abspath(file_path) | |
if not os.path.exists(abs_path) and (file_path.endswith('.pxi') or | |
relative_path_search): | |
# files are looked up relative to the main source file | |
rel_file_path = os.path.join(os.path.dirname(main_file), file_path) | |
if os.path.exists(rel_file_path): | |
abs_path = os.path.abspath(rel_file_path) | |
# search sys.path for external locations if a valid file hasn't been found | |
if not os.path.exists(abs_path): | |
for sys_path in sys.path: | |
test_path = os.path.realpath(os.path.join(sys_path, file_path)) | |
if os.path.exists(test_path): | |
return canonical_filename(test_path) | |
return canonical_filename(abs_path) | |
class Plugin(CoveragePlugin): | |
# map from traced file paths to absolute file paths | |
_file_path_map = None | |
# map from traced file paths to corresponding C files | |
_c_files_map = None | |
# map from parsed C files to their content | |
_parsed_c_files = None | |
def sys_info(self): | |
return [('Cython version', __version__)] | |
def file_tracer(self, filename): | |
""" | |
Try to find a C source file for a file path found by the tracer. | |
""" | |
if filename.startswith('<') or filename.startswith('memory:'): | |
return None | |
c_file = py_file = None | |
filename = canonical_filename(os.path.abspath(filename)) | |
if self._c_files_map and filename in self._c_files_map: | |
c_file = self._c_files_map[filename][0] | |
if c_file is None: | |
c_file, py_file = self._find_source_files(filename) | |
if not c_file: | |
return None # unknown file | |
# parse all source file paths and lines from C file | |
# to learn about all relevant source files right away (pyx/pxi/pxd) | |
# FIXME: this might already be too late if the first executed line | |
# is not from the main .pyx file but a file with a different | |
# name than the .c file (which prevents us from finding the | |
# .c file) | |
_, code = self._read_source_lines(c_file, filename) | |
if code is None: | |
return None # no source found | |
if self._file_path_map is None: | |
self._file_path_map = {} | |
return CythonModuleTracer(filename, py_file, c_file, self._c_files_map, self._file_path_map) | |
def file_reporter(self, filename): | |
# TODO: let coverage.py handle .py files itself | |
#ext = os.path.splitext(filename)[1].lower() | |
#if ext == '.py': | |
# from coverage.python import PythonFileReporter | |
# return PythonFileReporter(filename) | |
filename = canonical_filename(os.path.abspath(filename)) | |
if self._c_files_map and filename in self._c_files_map: | |
c_file, rel_file_path, code = self._c_files_map[filename] | |
else: | |
c_file, _ = self._find_source_files(filename) | |
if not c_file: | |
return None # unknown file | |
rel_file_path, code = self._read_source_lines(c_file, filename) | |
if code is None: | |
return None # no source found | |
return CythonModuleReporter(c_file, filename, rel_file_path, code) | |
def _find_source_files(self, filename): | |
basename, ext = os.path.splitext(filename) | |
ext = ext.lower() | |
if ext in MODULE_FILE_EXTENSIONS: | |
pass | |
elif ext == '.pyd': | |
# Windows extension module | |
platform_suffix = re.search(r'[.]cp[0-9]+-win[_a-z0-9]*$', basename, re.I) | |
if platform_suffix: | |
basename = basename[:platform_suffix.start()] | |
elif ext == '.so': | |
# Linux/Unix/Mac extension module | |
platform_suffix = re.search(r'[.](?:cpython|pypy)-[0-9]+[-_a-z0-9]*$', basename, re.I) | |
if platform_suffix: | |
basename = basename[:platform_suffix.start()] | |
elif ext == '.pxi': | |
# if we get here, it means that the first traced line of a Cython module was | |
# not in the main module but in an include file, so try a little harder to | |
# find the main source file | |
self._find_c_source_files(os.path.dirname(filename), filename) | |
if filename in self._c_files_map: | |
return self._c_files_map[filename][0], None | |
else: | |
# none of our business | |
return None, None | |
c_file = filename if ext in C_FILE_EXTENSIONS else _find_c_source(basename) | |
if c_file is None: | |
# a module "pkg/mod.so" can have a source file "pkg/pkg.mod.c" | |
package_root = find_root_package_dir.uncached(filename) | |
package_path = os.path.relpath(basename, package_root).split(os.path.sep) | |
if len(package_path) > 1: | |
test_basepath = os.path.join(os.path.dirname(filename), '.'.join(package_path)) | |
c_file = _find_c_source(test_basepath) | |
py_source_file = None | |
if c_file: | |
py_source_file = os.path.splitext(c_file)[0] + '.py' | |
if not os.path.exists(py_source_file): | |
py_source_file = None | |
try: | |
with open(c_file, 'rb') as f: | |
if b'/* Generated by Cython ' not in f.read(30): | |
return None, None # not a Cython file | |
except (IOError, OSError): | |
c_file = None | |
return c_file, py_source_file | |
def _find_c_source_files(self, dir_path, source_file): | |
""" | |
Desperately parse all C files in the directory or its package parents | |
(not re-descending) to find the (included) source file in one of them. | |
""" | |
if not os.path.isdir(dir_path): | |
return | |
splitext = os.path.splitext | |
for filename in os.listdir(dir_path): | |
ext = splitext(filename)[1].lower() | |
if ext in C_FILE_EXTENSIONS: | |
self._read_source_lines(os.path.join(dir_path, filename), source_file) | |
if source_file in self._c_files_map: | |
return | |
# not found? then try one package up | |
if is_package_dir(dir_path): | |
self._find_c_source_files(os.path.dirname(dir_path), source_file) | |
def _read_source_lines(self, c_file, sourcefile): | |
""" | |
Parse a Cython generated C/C++ source file and find the executable lines. | |
Each executable line starts with a comment header that states source file | |
and line number, as well as the surrounding range of source code lines. | |
""" | |
if self._parsed_c_files is None: | |
self._parsed_c_files = {} | |
if c_file in self._parsed_c_files: | |
code_lines = self._parsed_c_files[c_file] | |
else: | |
code_lines = self._parse_cfile_lines(c_file) | |
self._parsed_c_files[c_file] = code_lines | |
if self._c_files_map is None: | |
self._c_files_map = {} | |
for filename, code in code_lines.items(): | |
abs_path = _find_dep_file_path(c_file, filename, | |
relative_path_search=True) | |
self._c_files_map[abs_path] = (c_file, filename, code) | |
if sourcefile not in self._c_files_map: | |
return (None,) * 2 # e.g. shared library file | |
return self._c_files_map[sourcefile][1:] | |
def _parse_cfile_lines(self, c_file): | |
""" | |
Parse a C file and extract all source file lines that generated executable code. | |
""" | |
match_source_path_line = re.compile(r' */[*] +"(.*)":([0-9]+)$').match | |
match_current_code_line = re.compile(r' *[*] (.*) # <<<<<<+$').match | |
match_comment_end = re.compile(r' *[*]/$').match | |
match_trace_line = re.compile(r' *__Pyx_TraceLine\(([0-9]+),').match | |
not_executable = re.compile( | |
r'\s*c(?:type)?def\s+' | |
r'(?:(?:public|external)\s+)?' | |
r'(?:struct|union|enum|class)' | |
r'(\s+[^:]+|)\s*:' | |
).match | |
code_lines = defaultdict(dict) | |
executable_lines = defaultdict(set) | |
current_filename = None | |
with open(c_file) as lines: | |
lines = iter(lines) | |
for line in lines: | |
match = match_source_path_line(line) | |
if not match: | |
if '__Pyx_TraceLine(' in line and current_filename is not None: | |
trace_line = match_trace_line(line) | |
if trace_line: | |
executable_lines[current_filename].add(int(trace_line.group(1))) | |
continue | |
filename, lineno = match.groups() | |
current_filename = filename | |
lineno = int(lineno) | |
for comment_line in lines: | |
match = match_current_code_line(comment_line) | |
if match: | |
code_line = match.group(1).rstrip() | |
if not_executable(code_line): | |
break | |
code_lines[filename][lineno] = code_line | |
break | |
elif match_comment_end(comment_line): | |
# unexpected comment format - false positive? | |
break | |
# Remove lines that generated code but are not traceable. | |
for filename, lines in code_lines.items(): | |
dead_lines = set(lines).difference(executable_lines.get(filename, ())) | |
for lineno in dead_lines: | |
del lines[lineno] | |
return code_lines | |
class CythonModuleTracer(FileTracer): | |
""" | |
Find the Python/Cython source file for a Cython module. | |
""" | |
def __init__(self, module_file, py_file, c_file, c_files_map, file_path_map): | |
super(CythonModuleTracer, self).__init__() | |
self.module_file = module_file | |
self.py_file = py_file | |
self.c_file = c_file | |
self._c_files_map = c_files_map | |
self._file_path_map = file_path_map | |
def has_dynamic_source_filename(self): | |
return True | |
def dynamic_source_filename(self, filename, frame): | |
""" | |
Determine source file path. Called by the function call tracer. | |
""" | |
source_file = frame.f_code.co_filename | |
try: | |
return self._file_path_map[source_file] | |
except KeyError: | |
pass | |
abs_path = _find_dep_file_path(filename, source_file) | |
if self.py_file and source_file[-3:].lower() == '.py': | |
# always let coverage.py handle this case itself | |
self._file_path_map[source_file] = self.py_file | |
return self.py_file | |
assert self._c_files_map is not None | |
if abs_path not in self._c_files_map: | |
self._c_files_map[abs_path] = (self.c_file, source_file, None) | |
self._file_path_map[source_file] = abs_path | |
return abs_path | |
class CythonModuleReporter(FileReporter): | |
""" | |
Provide detailed trace information for one source file to coverage.py. | |
""" | |
def __init__(self, c_file, source_file, rel_file_path, code): | |
super(CythonModuleReporter, self).__init__(source_file) | |
self.name = rel_file_path | |
self.c_file = c_file | |
self._code = code | |
def lines(self): | |
""" | |
Return set of line numbers that are possibly executable. | |
""" | |
return set(self._code) | |
def _iter_source_tokens(self): | |
current_line = 1 | |
for line_no, code_line in sorted(self._code.items()): | |
while line_no > current_line: | |
yield [] | |
current_line += 1 | |
yield [('txt', code_line)] | |
current_line += 1 | |
def source(self): | |
""" | |
Return the source code of the file as a string. | |
""" | |
if os.path.exists(self.filename): | |
with open_source_file(self.filename) as f: | |
return f.read() | |
else: | |
return '\n'.join( | |
(tokens[0][1] if tokens else '') | |
for tokens in self._iter_source_tokens()) | |
def source_token_lines(self): | |
""" | |
Iterate over the source code tokens. | |
""" | |
if os.path.exists(self.filename): | |
with open_source_file(self.filename) as f: | |
for line in f: | |
yield [('txt', line.rstrip('\n'))] | |
else: | |
for line in self._iter_source_tokens(): | |
yield [('txt', line)] | |
def coverage_init(reg, options): | |
reg.add_file_tracer(Plugin()) | |