# pydiffchecker/pydiffchecker/line_shift_checker.py
#
# 84 lines
# 3.3 KiB
# Python

import re
from typing import List, Dict
from .helper import subprocess_readlines
class LineShiftChecker:
    """Map line positions of changed files between two git revisions.

    For every file that ``git diff --diff-filter=MR`` reports as modified or
    renamed between ``revision_since`` and ``revision_until``, each line of the
    old file is mapped to its ``'<path>:<line>'`` location in the new file, or
    to ``None`` when the diff marks that line as removed.
    """

    # Unified-diff hunk header. The ",count" parts are optional because git
    # omits them when a hunk side spans exactly one line ("@@ -3 +3 @@").
    # Groups: 1 = src start, 2 = src count, 3 = dst start, 4 = dst count.
    DIFF_BLOCK_REGEX = r'@@ -(\d+)(?:,(\d+))? \+(\d+)(?:,(\d+))? @@'

    def __init__(self, revision_since, revision_until) -> None:
        """Store the two revisions that are handed to the git commands."""
        self.revision_since = revision_since
        self.revision_until = revision_until

    def get_shifted_lines(self) -> Dict[str, Dict]:
        """Return the line mapping of every changed file, keyed by source path."""
        shifted_lines = {}
        for file_info in self.__get_changed_files():
            shifted_lines[file_info['src']] = self.__get_shifted_lines_in_file(file_info)
        return shifted_lines

    def __get_changed_files(self) -> List[Dict]:
        """List modified/renamed files as ``{'src': ..., 'dst': ...}`` dicts."""
        process_output = subprocess_readlines(['git', 'diff', '--name-status', '--diff-filter=MR',
                                               self.revision_since, self.revision_until])
        return self._parse_name_status(process_output)

    @staticmethod
    def _parse_name_status(lines) -> List[Dict]:
        """Parse ``git diff --name-status`` output lines.

        Each line is ``<status>\\t<path>`` or, for renames,
        ``<status>\\t<old path>\\t<new path>``. When no new path is present the
        destination equals the source.
        """
        file_list = []
        for line in lines:
            record = line.rstrip('\r\n')
            # Fields are tab-separated; splitting on tabs keeps paths that
            # contain spaces intact. Input without any tab falls back to
            # plain whitespace splitting.
            fields = record.split('\t') if '\t' in record else record.split()
            if len(fields) < 2:
                # Blank or unrecognised line: nothing to record.
                continue
            file_list.append({
                'src': fields[1],
                'dst': fields[2] if len(fields) > 2 else fields[1],
            })
        return file_list

    def __get_shifted_lines_in_file(self, file_info) -> 'Dict[str, str | None]':
        """Return the old-line -> new-line mapping for one changed file."""
        process_output = subprocess_readlines(['git', 'diff',
                                               self.revision_since, self.revision_until, '--',
                                               file_info['src'], file_info['dst']])
        lines_in_source_file = self.__count_lines_in_source_file(file_info['src'])
        return self._map_shifted_lines(process_output, file_info['src'], file_info['dst'],
                                       lines_in_source_file)

    @staticmethod
    def _hunk_start(start, count) -> int:
        """Return the first line number covered by one side of a hunk header.

        When the side is empty (count 0) the header names the line *preceding*
        the hunk, so the next real line is one further down.
        """
        first_line = int(start)
        if count is not None and int(count) == 0:
            first_line += 1
        return first_line

    @staticmethod
    def _map_shifted_lines(diff_lines, src, dst, lines_in_source_file) -> 'Dict[str, str | None]':
        """Build the line mapping from unified-diff output.

        ``diff_lines`` is an iterable of diff output lines, ``src``/``dst`` are
        the old and new paths used to build the ``'<path>:<line>'`` strings and
        ``lines_in_source_file`` is the number of lines of the old file.
        Keys are ``'<src>:<n>'``; values are ``'<dst>:<m>'`` or ``None`` for a
        removed line.
        """
        shifted_lines = {}
        src_line_index = 1
        dst_line_index = 1
        diff_started = False

        for line in diff_lines:
            # Anchor at the start of the line so hunk-header-like text inside
            # a context/added/removed line is not mistaken for a new hunk.
            matches = re.match(LineShiftChecker.DIFF_BLOCK_REGEX, line)
            if matches:
                diff_block_src_start = LineShiftChecker._hunk_start(matches.group(1), matches.group(2))
                diff_block_dst_start = LineShiftChecker._hunk_start(matches.group(3), matches.group(4))

                # fill shifted lines between 2 diff blocks
                for offset in range(diff_block_src_start - src_line_index):
                    shifted_lines[f'{src}:{src_line_index + offset}'] = f'{dst}:{dst_line_index + offset}'

                src_line_index = diff_block_src_start
                dst_line_index = diff_block_dst_start
                diff_started = True
                continue

            if not diff_started:
                # Still inside the file header ("diff --git", "---", "+++").
                continue

            if line.startswith(' '):
                # Context line: present on both sides.
                shifted_lines[f'{src}:{src_line_index}'] = f'{dst}:{dst_line_index}'
                src_line_index += 1
                dst_line_index += 1
            elif line.startswith('+'):
                # Added line: only advances the destination side.
                dst_line_index += 1
            elif line.startswith('-'):
                # Removed line: has no counterpart in the destination.
                shifted_lines[f'{src}:{src_line_index}'] = None
                src_line_index += 1

        # fill shifted lines until end of file
        for offset in range(lines_in_source_file - src_line_index + 1):
            shifted_lines[f'{src}:{src_line_index + offset}'] = f'{dst}:{dst_line_index + offset}'

        # Internal consistency check: every source line is mapped exactly once.
        assert lines_in_source_file == len(shifted_lines)
        return shifted_lines

    def __count_lines_in_source_file(self, file) -> int:
        """Count the lines of ``file`` as it exists at ``revision_since``."""
        process_output = subprocess_readlines(['git', 'show', f'{self.revision_since}:{file}'])
        return sum(1 for _ in process_output)