diff options
author | Arno Teigseth <arno@teigseth.no> | 2011-02-05 08:48:27 +0000 |
---|---|---|
committer | Arno Teigseth <arno@teigseth.no> | 2011-02-05 08:48:27 +0000 |
commit | 4f3d565a5e5ede6eb6fd1f276d4e8ad37b67b5ce (patch) | |
tree | 7af736540eca93034428a975bd850e709fbbe2e5 /JLanguageTool/src/dev/tools/stats.awk | |
parent | ecaee85ab5984ebadd56721c295dc26b3335f7ce (diff) | |
download | grammar-norwegian-master.tar.gz grammar-norwegian-master.tar.bz2 grammar-norwegian-master.tar.xz |
Diffstat (limited to 'JLanguageTool/src/dev/tools/stats.awk')
-rw-r--r-- | JLanguageTool/src/dev/tools/stats.awk | 62 |
1 files changed, 62 insertions, 0 deletions
# Origin: JLanguageTool/src/dev/tools/stats.awk (new file, mode 100644, blob aa1760e)
#Script to sort rule matches from LanguageTool
#Usage: gawk -f stats.awk <file_created_by_LanguageTool>
#(c) 2008, Marcin Milkowski
# This library is free software; you can redistribute it and/or
# modify it under the terms of the GNU Lesser General Public
# License as published by the Free Software Foundation; either
# version 2.1 of the License, or (at your option) any later version.
#
# This library is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
# Lesser General Public License for more details.
#
# You should have received a copy of the GNU Lesser General Public
# License along with this library; if not, write to the Free Software
# Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301
# USA

# Requires gawk: asort() and asorti() are GNU extensions.
#
# Globals:
#   hits[id]      number of match headers seen for a rule ID
#   notes[id]     newline-joined text collected for that rule ID
#   active_id     rule ID taken from the most recent match header
#   noted         Message/Suggestion lines seen since that header
#   have_matches  set to 1 once any match header has been seen

# Append one piece of text, preceded by a newline, to a rule's notes.
function add_note(id, text) {
    notes[id] = notes[id] "\n" text
}

# Match header: a line beginning with digits followed by ".)".
# Everything up to and including the last "ID: " is stripped, so the
# remainder of the record becomes the rule ID. Note that $0 itself is
# rewritten, and the rules below are evaluated against the rewritten record.
/^[0-9]+\.\)/ {
    sub(/^.*ID: /, "")
    active_id = $0
    hits[active_id]++
    have_matches = 1
    noted = 0
}

# Message / Suggestion lines are always kept for the active rule.
/^(Message: |Suggestion:)/ {
    add_note(active_id, $0)
    noted++
}

# Any other non-empty line (not "Time:", and without a " ^" marker) is kept
# only once at least one Message/Suggestion line followed the header.
noted > 0 && !/^($|Message: |Suggestion:|Time:)/ && !/ \^/ {
    add_note(active_id, $0)
}

# Marker line: starts with a space and contains " ^". It is stored with an
# extra trailing newline, which separates consecutive matches in the output.
/^ / && / \^/ {
    add_note(active_id, $0 "\n")
}

# Report: rules ordered by descending match count. Rules sharing the same
# count appear in the order asorti() gave their IDs.
END {
    if (have_matches == 1) {
        print "LanguageTool rule matches in descending order"
        print "============================================="
        print ""
    }

    total = asorti(hits, ids_sorted)   # rule IDs, sorted
    asort(hits, counts_sorted)         # match counts, ascending

    # Walk the counts from largest to smallest; for each one, emit every
    # not-yet-reported rule that has exactly that count.
    for (pos = total; pos >= 1; pos--) {
        wanted = counts_sorted[pos]
        for (k = 1; k <= total; k++) {
            name = ids_sorted[k]
            if (hits[name] != wanted || (name in shown))
                continue
            shown[name] = "done"
            print "Rule ID: " name ", matches: " hits[name]
            print notes[name]
            print "============="
        }
    }
}
\ No newline at end of file |