=================================================================== RCS file: /cvs/docbook2mdoc/statistics.c,v retrieving revision 1.3 retrieving revision 1.4 diff -u -p -r1.3 -r1.4 --- docbook2mdoc/statistics.c 2019/04/03 08:39:53 1.3 +++ docbook2mdoc/statistics.c 2019/04/03 09:49:49 1.4 @@ -1,4 +1,4 @@ -/* $Id: statistics.c,v 1.3 2019/04/03 08:39:53 schwarze Exp $ */ +/* $Id: statistics.c,v 1.4 2019/04/03 09:49:49 schwarze Exp $ */ /* * Copyright (c) 2019 Ingo Schwarze * @@ -36,6 +36,16 @@ * Typical usage: * statistics < filenames.txt | sort -n * statistics < filenames.txt | grep '\' | sort -n + * + * Relations already fully implemented are excluded by default. + * The option -a shows all relations. + * + * If two arguments (parent and child) are given, a histogram + * of the number of children of the kind in each parent is given + * in addition to the normal output. + * + * Example usage: + * statistics tgroup colspec < filenames.txt | grep colspec */ struct entry { @@ -52,7 +62,18 @@ static char **stack; static size_t stacksz; static size_t stacki; +static const int nchildsz = 8; +struct nchild { + char *parent; + char *child; + int freq[nchildsz]; + int count; +}; +static struct nchild nchild; +static char *fname; + + /* * Count one instance of a parent-child relation. * Before the special call table_add(NULL, NULL), @@ -70,6 +91,21 @@ table_add(const char *parent, const char *child) return; } + /* Optional parent-child histogram. */ + + if (init_done && parent != NULL && child != NULL && + nchild.parent != NULL && nchild.child != NULL && + strcmp(parent, nchild.parent) == 0 && + strcmp(child, nchild.child) == 0) { + if (nchild.count < nchildsz) { + nchild.freq[nchild.count]++; + if (nchild.count > 0) + nchild.freq[nchild.count - 1]--; + } else if (nchild.count == nchildsz) + puts(fname); + nchild.count++; + } + /* If the table entry already exists, increment its count. */ for (i = 0; i < tablei; i++) { @@ -109,6 +145,9 @@ table_add(const char *parent, const char *child) static void stack_push(const char *name) { + if (nchild.parent != NULL && strcmp(name, nchild.parent) == 0) + nchild.count = 0; + if (stacki == stacksz) { stacksz += 8; stack = reallocarray(stack, stacksz, sizeof(*stack)); @@ -283,7 +322,6 @@ parse_file(int fd, char *fname) int main(int argc, char *argv[]) { - char *fname; size_t fsz, i; ssize_t rsz; int ch, fd, show_all; @@ -298,7 +336,14 @@ main(int argc, char *argv[]) return 1; } } + argc -= optind; + argv += optind; + if (argc > 1) { + nchild.parent = argv[0]; + nchild.child = argv[1]; + } + /* Exclude relations that are already fully implemented. */ if (show_all == 0) { table_add("para", NULL); @@ -329,5 +374,13 @@ main(int argc, char *argv[]) if (table[i].count != -1) printf("%d\t%s\t%s\n", table[i].count, table[i].parent, table[i].child); + + /* Optional parent-child histogram. */ + if (nchild.parent != NULL) { + printf("%s %s", nchild.parent, nchild.child); + for (i = 0; i < nchildsz; i++) + printf(" %d", nchild.freq[i]); + putchar('\n'); + } return 0; }