/usr/share/idzebra-2.0/tab/nwi.flt is in idzebra-2.0-common 2.0.59-1ubuntu1.
This file is owned by root:root, with mode 0o644.
The actual contents of the file can be viewed below.
#
# Input filter for the Nordic Web Index (NWI) record syntax.
# The output record uses the 'gils' schema (see "begin record gils" below),
# so the element names emitted by the rules in this file are GILS-like.
#
# Each rule has the form:  /pattern/ [BODY /pattern/] { action }
# NOTE(review): rule-selection order and the exact meaning of BODY / $1 are
# defined by the Zebra regx filter, not by this file - confirm against the
# Zebra manual before reordering rules.
#
# An opening <nwi> tag starts a new record of type 'gils'.
/<nwi>/ { begin record gils }
# Ignore meta tags: a <meta...> tag and the rest of its line match this rule,
# which has an empty action.
/<meta.*>.*$/ {}
# Single-line fields: each rule matches an opening tag plus optional spaces,
# then BODY up to the end of the line (/$/), and emits $1 as the named element.
# NOTE(review): $1 presumably holds the BODY text (second pattern of the
# rule) - confirm against the Zebra regx filter documentation.
/<ti> */ BODY /$/ { data -element title $1 }
/<dm> */ BODY /$/ { data -element dateOfLastModification $1 }
/<ci> */ BODY /$/ { data -element controlIdentifier $1 }
# <si> opens a supplementalInformation element. It is closed by whichever
# rule later issues "end element" (no rule in this group closes it).
/<si>/ { begin element supplementalInformation }
/<lc> */ BODY /$/ { data -element lastChecked $1 }
/<by> */ BODY /$/ { data -element bytes $1 }
# <av> opens an availability element; <avli> and <ty> emit linkage and
# linkageType data.
/<av>/ { begin element availability }
/<avli> */ BODY /$/ { data -element linkage $1 }
/<ty> */ BODY /$/ { data -element linkageType $1 }
# <lsi> opens a localSubjectIndex element; each <dh> line emits one
# localSubjectTerm.
/<lsi>/ { begin element localSubjectIndex }
/<dh> */ BODY /$/ { data -element localSubjectTerm $1 }
# We do not want <ip> (sample text) to end up inside localSubjectIndex, so
# the <ip> rule first issues "end element" and only then emits sampleText.
#
# Disabled alternative: it also consumed the following </lsi> end tag, since
# the element it belongs to has already been ended by this rule.
#/<ip>[ \n]*/ BODY /<\/ip>[ \n]*<\/lsi>/ {
# end element;
# data -element sampleText $1
# }
#
# Active rule: matches <ip>, optional spaces/newlines, then BODY up to </ip>.
# Unlike the field rules that stop at end of line, the terminator here is the
# closing tag.
# NOTE(review): this variant does not consume </lsi>, so a following </lsi>
# will match the generic end-tag rule in this file and issue a second
# "end element" - confirm that this is harmless for the enclosing element.
/<ip>[ \n]*/ BODY /<\/ip>/ {
end element;
data -element sampleText $1
}
# <cr> opens a crossReference element; <li> emits linkage data and <cp>
# emits title data.
# NOTE(review): these reuse the element names 'linkage' and 'title' that are
# also emitted by the <avli> and <ti> rules; presumably they are told apart
# by the enclosing crossReference element - confirm against the gils schema.
/<cr>/ { begin element crossReference }
/<li> */ BODY /$/ { data -element linkage $1 }
/<cp> */ BODY /$/ { data -element title $1 }
# The closing </nwi> tag ends the current record.
/<\/nwi>/ { end record }
# Generic end-marker: any other closing tag </...> issues "end element".
# NOTE(review): </nwi> also matches this pattern; which rule wins depends on
# the regx filter's rule-selection policy - confirm before reordering.
/<\/[^>]*>/ { end element }
# Catch-all rules: a newline or any other single character matches a rule
# with an empty action.
/\n/ { }
/./ {}
|