summaryrefslogtreecommitdiff
path: root/goencxml.go
blob: 35ddf5c90cc71042067d0e475fd315e3c1436347 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
package main

import (
	"bufio"
	"bytes"
	"encoding/xml"
	"fmt"
	"io"
	"os"
)

func process(r *bufio.Reader) {
	var (
		intitle       bool
		inarticlemeta bool
		buffer        bytes.Buffer
	)

	dec := xml.NewDecoder(r)
	for {
		token, err := dec.Token()
		if err == io.EOF {
			break
		}
		if err != nil {
			fmt.Fprintf(os.Stderr, "Error when decoding XML file %q\n", err)
			os.Exit(1)
		}
		switch t := token.(type) {
		case xml.StartElement:
			if t.Name.Local == "article-meta" {
				inarticlemeta = true
				continue
			}
			if t.Name.Local == "article-title" && inarticlemeta {
				intitle = true
			}
		case xml.CharData:
			if !intitle || !inarticlemeta {
				continue
			}
			buffer.Write(t)
		case xml.EndElement:
			if t.Name.Local == "article-meta" {
				inarticlemeta = false
				continue
			}
			if t.Name.Local == "article-title" && inarticlemeta {
				intitle = false
				fmt.Printf("article-title: %s\n", buffer.String())
				buffer.Reset()
			}
		}
	}
}

func main() {
	for _, arg := range os.Args[1:] {
		file, err := os.Open(arg)
		if err != nil {
			fmt.Fprintf(os.Stderr, "Error when opening file %q\n", arg)
			os.Exit(1)
		}

		r := bufio.NewReader(file)
		process(r)
		file.Close()
	}
}