|
1 package tidystats; |
|
2 |
|
3 import java.io.IOException; |
|
4 import java.nio.charset.Charset; |
|
5 import java.nio.file.FileSystem; |
|
6 import java.nio.file.FileSystems; |
|
7 import java.nio.file.Files; |
|
8 import java.nio.file.Path; |
|
9 import java.util.ArrayList; |
|
10 import java.util.Comparator; |
|
11 import java.util.HashMap; |
|
12 import java.util.List; |
|
13 import java.util.Map; |
|
14 import java.util.Set; |
|
15 import java.util.TreeMap; |
|
16 import java.util.TreeSet; |
|
17 import java.util.regex.Matcher; |
|
18 import java.util.regex.Pattern; |
|
19 |
|
20 public class Main { |
|
21 public static void main(String... args) throws IOException { |
|
22 new Main().run(args); |
|
23 } |
|
24 |
|
25 void run(String... args) throws IOException { |
|
26 FileSystem fs = FileSystems.getDefault(); |
|
27 List<Path> paths = new ArrayList<>(); |
|
28 |
|
29 int i; |
|
30 for (i = 0; i < args.length; i++) { |
|
31 String arg = args[i]; |
|
32 if (arg.startsWith("-")) |
|
33 throw new IllegalArgumentException(arg); |
|
34 else |
|
35 break; |
|
36 } |
|
37 |
|
38 for ( ; i < args.length; i++) { |
|
39 Path p = fs.getPath(args[i]); |
|
40 paths.add(p); |
|
41 } |
|
42 |
|
43 for (Path p: paths) { |
|
44 scan(p); |
|
45 } |
|
46 |
|
47 print("%6d files read", files); |
|
48 print("%6d files had no errors or warnings", ok); |
|
49 print("%6d files reported \"Not all warnings/errors were shown.\"", overflow); |
|
50 print("%6d errors found", errs); |
|
51 print("%6d warnings found", warns); |
|
52 print("%6d recommendations to use CSS", css); |
|
53 print(""); |
|
54 |
|
55 Map<Integer, Set<String>> sortedCounts = new TreeMap<>( |
|
56 new Comparator<Integer>() { |
|
57 @Override |
|
58 public int compare(Integer o1, Integer o2) { |
|
59 return o2.compareTo(o1); |
|
60 } |
|
61 }); |
|
62 |
|
63 for (Map.Entry<Pattern, Integer> e: counts.entrySet()) { |
|
64 Pattern p = e.getKey(); |
|
65 Integer n = e.getValue(); |
|
66 Set<String> set = sortedCounts.get(n); |
|
67 if (set == null) |
|
68 sortedCounts.put(n, (set = new TreeSet<>())); |
|
69 set.add(p.toString()); |
|
70 } |
|
71 |
|
72 for (Map.Entry<Integer, Set<String>> e: sortedCounts.entrySet()) { |
|
73 for (String p: e.getValue()) { |
|
74 if (p.startsWith(".*")) p = p.substring(2); |
|
75 print("%6d: %s", e.getKey(), p); |
|
76 } |
|
77 } |
|
78 } |
|
79 |
|
80 void scan(Path p) throws IOException { |
|
81 if (Files.isDirectory(p)) { |
|
82 for (Path c: Files.newDirectoryStream(p)) { |
|
83 scan(c); |
|
84 } |
|
85 } else if (isTidyFile(p)) { |
|
86 scan(Files.readAllLines(p, Charset.defaultCharset())); |
|
87 } |
|
88 } |
|
89 |
|
90 boolean isTidyFile(Path p) { |
|
91 return Files.isRegularFile(p) && p.getFileName().toString().endsWith(".tidy"); |
|
92 } |
|
93 |
|
94 void scan(List<String> lines) { |
|
95 Matcher m; |
|
96 files++; |
|
97 for (String line: lines) { |
|
98 if (okPattern.matcher(line).matches()) { |
|
99 ok++; |
|
100 } else if ((m = countPattern.matcher(line)).matches()) { |
|
101 warns += Integer.valueOf(m.group(1)); |
|
102 errs += Integer.valueOf(m.group(2)); |
|
103 if (m.group(3) != null) |
|
104 overflow++; |
|
105 } else if ((m = guardPattern.matcher(line)).matches()) { |
|
106 boolean found = false; |
|
107 for (Pattern p: patterns) { |
|
108 if ((m = p.matcher(line)).matches()) { |
|
109 found = true; |
|
110 count(p); |
|
111 break; |
|
112 } |
|
113 } |
|
114 if (!found) |
|
115 System.err.println("Unrecognized line: " + line); |
|
116 } else if (cssPattern.matcher(line).matches()) { |
|
117 css++; |
|
118 } |
|
119 } |
|
120 } |
|
121 |
|
122 Map<Pattern, Integer> counts = new HashMap<>(); |
|
123 void count(Pattern p) { |
|
124 Integer i = counts.get(p); |
|
125 counts.put(p, (i == null) ? 1 : i + 1); |
|
126 } |
|
127 |
|
128 void print(String format, Object... args) { |
|
129 System.out.println(String.format(format, args)); |
|
130 } |
|
131 |
|
132 Pattern okPattern = Pattern.compile("No warnings or errors were found."); |
|
133 Pattern countPattern = Pattern.compile("([0-9]+) warnings, ([0-9]+) errors were found!.*?(Not all warnings/errors were shown.)?"); |
|
134 Pattern cssPattern = Pattern.compile("You are recommended to use CSS.*"); |
|
135 Pattern guardPattern = Pattern.compile("line [0-9]+ column [0-9]+ - (Error|Warning):.*"); |
|
136 |
|
137 Pattern[] patterns = { |
|
138 Pattern.compile(".*Error: <.*> is not recognized!"), |
|
139 Pattern.compile(".*Error: missing quote mark for attribute value"), |
|
140 Pattern.compile(".*Warning: <.*> anchor \".*\" already defined"), |
|
141 Pattern.compile(".*Warning: <.*> attribute \".*\" has invalid value \".*\""), |
|
142 Pattern.compile(".*Warning: <.*> attribute \".*\" lacks value"), |
|
143 Pattern.compile(".*Warning: <.*> attribute \".*\" lacks value"), |
|
144 Pattern.compile(".*Warning: <.*> attribute with missing trailing quote mark"), |
|
145 Pattern.compile(".*Warning: <.*> dropping value \".*\" for repeated attribute \".*\""), |
|
146 Pattern.compile(".*Warning: <.*> inserting \".*\" attribute"), |
|
147 Pattern.compile(".*Warning: <.*> is probably intended as </.*>"), |
|
148 Pattern.compile(".*Warning: <.*> isn't allowed in <.*> elements"), |
|
149 Pattern.compile(".*Warning: <.*> lacks \".*\" attribute"), |
|
150 Pattern.compile(".*Warning: <.*> missing '>' for end of tag"), |
|
151 Pattern.compile(".*Warning: <.*> proprietary attribute \".*\""), |
|
152 Pattern.compile(".*Warning: <.*> unexpected or duplicate quote mark"), |
|
153 Pattern.compile(".*Warning: <a> cannot copy name attribute to id"), |
|
154 Pattern.compile(".*Warning: <a> escaping malformed URI reference"), |
|
155 Pattern.compile(".*Warning: <blockquote> proprietary attribute \"pre\""), |
|
156 Pattern.compile(".*Warning: discarding unexpected <.*>"), |
|
157 Pattern.compile(".*Warning: discarding unexpected </.*>"), |
|
158 Pattern.compile(".*Warning: entity \".*\" doesn't end in ';'"), |
|
159 Pattern.compile(".*Warning: inserting implicit <.*>"), |
|
160 Pattern.compile(".*Warning: inserting missing 'title' element"), |
|
161 Pattern.compile(".*Warning: missing <!DOCTYPE> declaration"), |
|
162 Pattern.compile(".*Warning: missing <.*>"), |
|
163 Pattern.compile(".*Warning: missing </.*> before <.*>"), |
|
164 Pattern.compile(".*Warning: nested emphasis <.*>"), |
|
165 Pattern.compile(".*Warning: plain text isn't allowed in <.*> elements"), |
|
166 Pattern.compile(".*Warning: replacing <p> by <br>"), |
|
167 Pattern.compile(".*Warning: replacing invalid numeric character reference .*"), |
|
168 Pattern.compile(".*Warning: replacing unexpected .* by </.*>"), |
|
169 Pattern.compile(".*Warning: trimming empty <.*>"), |
|
170 Pattern.compile(".*Warning: unescaped & or unknown entity \".*\""), |
|
171 Pattern.compile(".*Warning: unescaped & which should be written as &"), |
|
172 Pattern.compile(".*Warning: using <br> in place of <p>") |
|
173 }; |
|
174 |
|
175 int files; |
|
176 int ok; |
|
177 int warns; |
|
178 int errs; |
|
179 int css; |
|
180 int overflow; |
|
181 } |
|
182 |