-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrepo_size.py
70 lines (56 loc) · 1.62 KB
/
repo_size.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
from collections import defaultdict
import os
ignore = [
'.DS_Store',
'__pycache__',
'node_modules',
'.git',
'.venv',
'.png',
'.ico',
'.jpg',
'.json',
'pip.lock',
'pnpm-lock.yaml',
'yarn.lock',
'market_data/',
'build/'
]
def check_ignore(path):
return all(x not in path for x in ignore)
def iterate_all_files_recursively(folder_path):
for root, _, files in os.walk(folder_path):
for file in files:
path = os.path.join(root, file)
if check_ignore(path):
yield path
def read_line_count(path):
with open(path, 'r', encoding='utf8') as f:
return sum(1 for line in f)
def read_all_line_counts(files):
counts = []
for f in files:
counts.append(read_line_count(f))
return counts
if __name__ == '__main__':
files = []
for i in iterate_all_files_recursively('.'):
files.append(i)
count = len(files)
line_counts = read_all_line_counts(files)
print(f"File count: {count}")
print(f"Line count: {sum(line_counts)}")
# Calculate folder stats
folderdict = defaultdict({'files': 0, 'lines': 0}.copy)
for i, f in enumerate(files):
parts = f.split('/')
if len(parts) == 2:
folderdict['<root>']['files'] += 1
folderdict['<root>']['lines'] += line_counts[i]
else:
folder = parts[1]
folderdict[folder]['files'] += 1
folderdict[folder]['lines'] += line_counts[i]
print("Folder stats:")
for k, v in folderdict.items():
print(f" {k}: {v['files']} files, {v['lines']} lines")