X-Git-Url: https://pintos-os.org/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=parse-all-xml;h=a91f68eab6a4e95ca8f1e85b9d3d0c7146ca9654;hb=7674958d6669183799289f701e1148b6903b801a;hp=98a4258ddbd50c36bbc47fbca083df5491837844;hpb=0f833bb108ef5a1d78be8ee31b2fe2855f6bd03b;p=pspp

diff --git a/parse-all-xml b/parse-all-xml
index 98a4258ddb..a91f68eab6 100755
--- a/parse-all-xml
+++ b/parse-all-xml
@@ -1,5 +1,22 @@
 #! /bin/sh
-for d in `ls -1 unzipped/*/*.xml |grep -vE 'notes|table|warning|chart|model'`
-do
-  ./parse-xml $d
-done | sort -u
+
+# Parse the structure members that do not represent models or graphs
+# and that are not page setups (which are always the first structure member).
+# Also skip those with borderProperties, which indicate the non-"light"
+# format.
+lightTables=`ls -1 unzipped/*/*.xml |grep -vE 'notes|table|warning|chart|model' \
+    | xargs grep -EL '<([a-z]*:)?(model|graph|pageSetup|borderProperties)'`
+printf 'Structure:\n'
+for d in $lightTables; do
+    ./parse-xml $d containment
+done | sort | uniq -c | sort -rn
+
+printf '\nAttributes:\n'
+for d in $lightTables; do
+    ./parse-xml $d attributes
+done | sort | uniq -c | sort -rn
+
+printf '\nLabels:\n'
+for d in $lightTables; do
+    ./parse-xml $d labels
+done | sort | uniq -c | sort -rn