Version 2.0.50
[idzebra-moved-to-github.git] / tab / nwi.flt
1 #
2 # Input-filter for the Nordic Web Index record syntax. Output is 'gils-like'.
3 # Each rule has the form /pattern/ { action }. In rules written as
4 # /start/ BODY /end/ the action uses $1 for the text between the two patterns.
5 # <nwi> opens a new record; 'gils' is the name handed to 'begin record'.
6 /<nwi>/                            { begin record gils }
7
8 # Ignore meta tags: from <meta...> to the end of the line, with an empty action.
9
10 /<meta.*>.*$/                    {}
11 # One-line fields: the text after the tag (leading spaces skipped) up to end of line.
12 /<ti> */ BODY /$/                  { data -element title $1 }
13
14 /<dm> */  BODY /$/                  { data -element dateOfLastModification $1 }
15
16 /<ci> */ BODY /$/                  { data -element controlIdentifier $1 }
17 # Container tags: each start tag opens an element; closing tags are handled further down.
18 /<si>/                           { begin element supplementalInformation }
19 /<lc> */ BODY /$/                  { data -element lastChecked $1 }
20 /<by> */ BODY /$/                  { data -element bytes $1 }
21 # Availability: <avli> supplies the linkage, <ty> the linkage type.
22 /<av>/                           { begin element availability }
23 /<avli> */ BODY /$/                { data -element linkage $1 }
24 /<ty> */ BODY /$/                  { data -element linkageType $1 }
25 # Local subject index: every <dh> line adds one localSubjectTerm.
26 /<lsi>/                          { begin element localSubjectIndex }
27 /<dh> */ BODY /$/                  { data -element localSubjectTerm $1 }
28
29 # Don't want to have <ip> inside of localSubjectIndex, so the <ip> rule
30 # ends the open element (presumably localSubjectIndex) before emitting sampleText.
31 # Disabled variant: it also consumed the </lsi> end-tag that follows </ip>.
32 #/<ip>[ \n]*/ BODY /<\/ip>[ \n]*<\/lsi>/  {
33 #                                   end element;
34 #                                   data -element sampleText $1
35 #                                }
36 # Active variant: stops at </ip>, so a following </lsi> falls through to the generic end-marker rule. NOTE(review): confirm that extra 'end element' is harmless.
37 /<ip>[ \n]*/ BODY /<\/ip>/       {
38                                    end element;
39                                    data -element sampleText $1
40                                  }
41 # Cross references: <li> supplies the linkage and <cp> the title of the referenced item.
42 /<cr>/                           { begin element crossReference }
43 /<li> */ BODY /$/                  { data -element linkage $1 }
44 /<cp> */ BODY /$/                  { data -element title $1 }
45 # </nwi> closes the record opened by <nwi>.
46 /<\/nwi>/                        { end record }
47
48 # Generic end-marker: a closing tag ends an element. NOTE(review): </nwi> also matches this pattern; presumably the earlier, specific rule wins - confirm.
49 # The last two rules match newlines and any other single character with empty actions.
50 /<\/[^>]*>/                      { end element }
51 /\n/                             { }
52 /./ {}