gitinspector/blame.py
Adam Waldenberg 494679520f Enabled threading in the blame module and removed the system module.
To accommodate this modification, the changing of working directory (when
a repository is specified) has been moved from the system module to the
main gitinspector module. This enables us to change directory in one go
when gitinspector starts, thus removing the need for the previous system
module.
2012-05-20 22:02:08 +02:00

128 lines
3.8 KiB
Python

# coding: utf-8
#
# Copyright © 2012 Ejwa Software. All rights reserved.
#
# This file is part of gitinspector.
#
# gitinspector is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# gitinspector is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with gitinspector. If not, see <http://www.gnu.org/licenses/>.
from changes import FileDiff
import comment
import missing
import multiprocessing
import os
import re
import sys
import terminal
import threading
class BlameEntry:
rows = 0
comments = 0
__thread_lock__ = threading.BoundedSemaphore(multiprocessing.cpu_count())
__blame_lock__ = threading.Lock()
class BlameThread(threading.Thread):
def __init__(self, blame_string, extension, blames):
__thread_lock__.acquire() # Lock controlling the number of threads running
threading.Thread.__init__(self)
self.blame_string = blame_string
self.extension = extension
self.blames = blames
def run(self):
git_blame_r = os.popen(self.blame_string)
is_inside_comment = False
for j in git_blame_r.readlines():
if Blame.is_blame_line(j):
author = Blame.get_author(j)
content = Blame.get_content(j)
__blame_lock__.acquire() # Global lock used to protect calls from here...
if self.blames.get(author, None) == None:
self.blames[author] = BlameEntry()
if comment.is_comment(self.extension, content):
self.blames[author].comments += 1
if is_inside_comment:
if comment.has_comment_end(self.extension, content):
is_inside_comment = False
else:
self.blames[author].comments += 1
elif comment.has_comment_begining(self.extension, content):
is_inside_comment = True
self.blames[author].rows += 1
__blame_lock__.release() # ...to here.
__thread_lock__.release() # Lock controlling the number of threads running
class Blame:
def __init__(self, hard):
self.blames = {}
ls_tree_r = os.popen("git ls-tree --name-only -r HEAD")
lines = ls_tree_r.readlines()
for i, row in enumerate(lines):
if FileDiff.is_valid_extension(row):
if not missing.add(row.strip()):
blame_string = "git blame -w {0} \"".format("-C -C -M" if hard else "") + row.strip() + "\""
thread = BlameThread(blame_string, FileDiff.get_extension(row), self.blames)
thread.start()
if hard:
Blame.output_progress(i, len(lines))
# Make sure all threads have completed.
for i in range(0, multiprocessing.cpu_count()):
__thread_lock__.acquire()
@staticmethod
def output_progress(pos, length):
if sys.stdout.isatty():
terminal.clear_row()
print "\bChecking how many rows belong to each author (Progress): " + str(100 * pos / length) + "%",
sys.stdout.flush()
@staticmethod
def is_blame_line(string):
return string.find(" (") != -1
@staticmethod
def get_author(string):
author = re.search(" \((.*?)\d\d\d\d-\d\d-\d\d", string)
return re.sub("[^\w ]", "", author.group(1)).strip()
@staticmethod
def get_content(string):
content = re.search(" \d+\)(.*)", string)
return content.group(1).lstrip()
def output(hard):
print ""
blame = Blame(hard)
if hard:
terminal.clear_row()
print "\bBelow is the number of rows from each author that have survived and"
print "are still intact in the current revision:\n"
terminal.printb("Author".ljust(21) + "Rows".rjust(10) + "% in comments".rjust(16))
for i in sorted(blame.blames.items()):
print i[0].ljust(20)[0:20],
print str(i[1].rows).rjust(10),
print "{0:.2f}".format(100.0 * i[1].comments / i[1].rows).rjust(15)