git hyper-blame: Fix tabulation of Unicode characters in author name.

Previously, it counted the number of UTF-8 bytes when spacing out the
table, not the number of code points.

Bug: 808905
Change-Id: Ice5504089e0f7097e108c6dfbbb810620b9dfc94
Reviewed-on: https://chromium-review.googlesource.com/901142
Commit-Queue: Matt Giuca <mgiuca@chromium.org>
Reviewed-by: Robbie Iannucci <iannucci@chromium.org>

commit: a148b5ee55b107b0ad99b0ea69060b6609d97656 [log] [tgz]
author: Matt Giuca <mgiuca@chromium.org> Wed Feb 07 13:24:50 2018 +1100
committer: Commit Bot <commit-bot@chromium.org> Mon Feb 12 23:28:47 2018 +0000
tree: 7a629e8a468d4e9213aca62bdada5ec7d2ab654f
parent: 63560ada2d710e8eb27027779650f40ab71ac6ab [diff] [blame]
diff --git a/git_hyper_blame.py b/git_hyper_blame.py
index b24df5f..3e08513 100755
--- a/git_hyper_blame.py
+++ b/git_hyper_blame.py

@@ -94,6 +94,11 @@
     yield BlameLine(commit, context, lineno_then, lineno_now, False)
 
 
+def num_codepoints(s):
+  """Gets the length of a UTF-8 byte string, in Unicode codepoints."""
+  return len(s.decode('utf-8', errors='replace'))
+
+
 def print_table(table, colsep=' ', rowsep='\n', align=None, out=sys.stdout):
   """Print a 2D rectangular array, aligning columns with spaces.
 
@@ -107,9 +112,10 @@
   colwidths = None
   for row in table:
     if colwidths is None:
-      colwidths = [len(x) for x in row]
+      colwidths = [num_codepoints(x) for x in row]
     else:
-      colwidths = [max(colwidths[i], len(x)) for i, x in enumerate(row)]
+      colwidths = [max(colwidths[i], num_codepoints(x))
+                   for i, x in enumerate(row)]
 
   if align is None:  # pragma: no cover
     align = 'l' * len(colwidths)
@@ -117,7 +123,7 @@
   for row in table:
     cells = []
     for i, cell in enumerate(row):
-      padding = ' ' * (colwidths[i] - len(cell))
+      padding = ' ' * (colwidths[i] - num_codepoints(cell))
       if align[i] == 'r':
         cell = padding + cell
       elif i < len(row) - 1:
commit	a148b5ee55b107b0ad99b0ea69060b6609d97656	[log] [tgz]
author	Matt Giuca <mgiuca@chromium.org>	Wed Feb 07 13:24:50 2018 +1100
committer	Commit Bot <commit-bot@chromium.org>	Mon Feb 12 23:28:47 2018 +0000
tree	7a629e8a468d4e9213aca62bdada5ec7d2ab654f
parent	63560ada2d710e8eb27027779650f40ab71ac6ab [diff] [blame]