aboutsummaryrefslogtreecommitdiff
path: root/tabsvsspaces
diff options
context:
space:
mode:
authorRoman Gräf <romangraef@loves.dicksinhisan.us>2020-06-21 02:44:37 +0200
committerRoman Gräf <romangraef@loves.dicksinhisan.us>2020-06-21 02:44:37 +0200
commit04684f0b25c924d6d88a0be7f7fb0d3368de406f (patch)
tree062f14b0a987275390dab58605f8ca2dea74361c /tabsvsspaces
parent090b44edd8bf42e3d9574680dfa2e27cae8e595e (diff)
downloadtabsvsspaces-master.tar.gz
tabsvsspaces-master.tar.bz2
tabsvsspaces-master.zip
pypi releaseHEADmaster
Diffstat (limited to 'tabsvsspaces')
-rw-r--r--tabsvsspaces/find_stats.py63
1 files changed, 63 insertions, 0 deletions
diff --git a/tabsvsspaces/find_stats.py b/tabsvsspaces/find_stats.py
new file mode 100644
index 0000000..d72385e
--- /dev/null
+++ b/tabsvsspaces/find_stats.py
@@ -0,0 +1,63 @@
+import os
+from pathlib import Path
+
+from .stats import Statistics
+
+IGNORED_FOLDERS = [
+ 'venv',
+ 'build',
+ 'dist',
+ 'generated',
+ 'generated-src',
+]
+
+
+def find_all_files(folder: Path, verbose: bool = False):
+ def gen():
+ for subpath, subfolders, filenames in os.walk(str(folder)):
+ subfolders[:] = [subfolder for subfolder in subfolders if
+ not (subfolder.startswith('.') or subfolder.lower() in IGNORED_FOLDERS)]
+ current_path = Path(subpath)
+ for file in filenames:
+ file_path = current_path / file
+ if not file.startswith('.'):
+ yield file_path
+ if verbose:
+ print('Scanning', file_path)
+ else:
+ if verbose:
+ print('Skipping', file_path)
+
+ return list(gen())
+
+
+def find_stats_for_file(filename: Path, name: str, stats: Statistics):
+ extension = filename.name.split('.')[-1]
+ try:
+ for line in filename.read_text().split('\n'):
+ spaces = False
+ tabs = False
+ while len(line) > 0 and line[0] in [' ', '\t']:
+ if line[0] == ' ':
+ spaces = True
+ if line[0] == '\t':
+ tabs = True
+ line = line[1:]
+ if spaces and tabs:
+ stats.add_mixed_line(extension=extension,
+ filename=name)
+ elif spaces:
+ stats.add_spaces(extension=extension)
+ elif tabs:
+ stats.add_tabs(extension=extension)
+ except (UnicodeDecodeError, OSError):
+ pass
+
+
+def find_stats(folder: Path, verbose: bool = False) -> Statistics:
+ folder = folder.resolve()
+ files = find_all_files(folder, verbose=verbose)
+ stats = Statistics()
+ for file in files:
+ find_stats_for_file(folder / file, file, stats)
+ return stats