Explicitly open the input file as UTF-8, in case the locale's default encoding is something else. diff -x config.log -x config.status -ru tmp/intel-gpu-tools-1.7/debugger/system_routine/pre_cpp.py work/intel-gpu-tools-1.7/debugger/system_routine/pre_cpp.py --- tmp/intel-gpu-tools-1.7/debugger/system_routine/pre_cpp.py 2014-05-13 13:31:22.000000000 +0100 +++ work/intel-gpu-tools-1.7/debugger/system_routine/pre_cpp.py 2014-06-30 23:16:12.743000000 +0100 @@ -33,7 +33,7 @@ import sys,re -file = open(sys.argv[1], "r") +file = open(sys.argv[1], "r", encoding="UTF-8") lines = file.readlines() len(lines)