#!/bin/sh -
#
# Script to extract tables from the PKCS #11 specification and format
# them as YAML comment blocks.
#
# This isn't even half-assed, more like quarter-assed. If I thought
# we'd be using it a lot I'd rewrite it in Python.
#
# Author: Rob Austein
# Copyright (c) 2015, SUNET
#
# Redistribution and use in source and binary forms, with or
# without modification, are permitted provided that the following
# conditions are met:
#
# 1. Redistributions of source code must retain the above copyright
# notice, this list of conditions and the following disclaimer.
#
# 2. Redistributions in binary form must reproduce the above copyright
# notice, this list of conditions and the following disclaimer in
# the documentation and/or other materials provided with the
# distribution.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
# FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
# COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
# INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
# BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
# LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
# CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
# STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
# ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
# Where the HTML rendition of the PKCS #11 specification is published,
# and the local file name (last path component of the URL) under which
# the archive is kept in the current directory.
url=http://www.cryptsoft.com/pkcs11doc/download/pkcs11doc-v230.tgz
tar=${url##*/}

# Fetch the archive unless a readable copy is already present.  The
# download goes to a temporary name and is renamed only once wget has
# succeeded, so an interrupted transfer cannot leave a truncated file
# behind that a later run would mistake for the real archive.
if ! test -r "$tar"
then
    wget -O "$tar.part" "$url" && mv "$tar.part" "$tar" || {
        status=$?
        rm -f "$tar.part"
        printf '%s: unable to download %s\n' "$0" "$url" >&2
        exit "$status"
    }
fi
# Read a tar listing on stdin and, for every member whose name matches
# the pattern for an HTML page of specification section 9 or 11, print:
#
#     <sort key> <member name> <title>
#
# The sort key is built from the third, fourth and fifth "__"-separated
# pieces of the member name (section, subsection, sub-subsection), each
# zero-padded to four digits; a piece that is not purely numeric counts
# as 0.  The title is the next-to-last piece of the member name when it
# is split on "/" and ".".
list_sections() {
    awk '
        /group__SEC__(9|11)__.*\.html/ {
            n = split($0, a, "[/.]");
            title = a[n-1];
            n = split($0, a, /__/);
            s1 = a[3];
            s2 = (a[4] ~ /^[0-9]+$/) ? a[4] : 0;
            s3 = (a[5] ~ /^[0-9]+$/) ? a[5] : 0;
            idx = sprintf("%04d%04d%04d", s1, s2, s3);
            print idx, $0, title;
        }
    '
}

# Write a "###"-framed heading containing the title given as $1, then
# copy from stdin every line that starts with "|" or "+" (the lines of
# an ASCII-art table), each prefixed with "# ".
#
# The heading is printed with printf '%s' rather than handed to awk via
# -v, because awk applies backslash-escape processing to -v values.
format_tables() {
    printf '\n###\n# %s\n###\n\n' "$1"
    awk '/^[|+]/ { print "#", $0 }'
}

# List the archive, pick out the pages of interest, put them in
# document order, then render each page to plain text and keep only its
# tables.  The idx field exists solely for sorting and is not used in
# the loop body.  Member names containing whitespace are not supported:
# the fields are separated by blanks.
tar -tf "$tar" |
    list_sections |
    sort -n |
    while read -r idx fn title
    do
        tar -xOf "$tar" "$fn" |
            w3m -dump -O us-ascii -T text/html |
            format_tables "$title"
    done