File: x2j_bulk.go

package info (click to toggle)
golang-github-clbanning-mxj 2.7.0-1
  • links: PTS, VCS
  • area: main
  • in suites: sid, trixie
  • size: 2,200 kB
  • sloc: xml: 176; makefile: 4
file content (129 lines) | stat: -rw-r--r-- 3,659 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
// Copyright 2012-2018 Charles Banning. All rights reserved.
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file

//	x2j_bulk.go: Process files with multiple XML messages.
// Extends x2m_bulk.go to work with JSON strings rather than map[string]interface{}.

package x2j

import (
	"bytes"
	"io"
	"os"
	"regexp"

	"github.com/clbanning/mxj/v2"
)

// XmlMsgsFromFileAsJson reads the whole file 'fname', which may contain multiple
// XML messages, and hands each message to 'phandler' as a JSON string.
//	'fname' is name of file
//	'phandler' is the JSON string processing handler. Return of 'false' stops further processing.
//	'ehandler' is the parsing error handler. Return of 'false' stops further processing and returns error.
//	'recast' is optional; when exactly one value is supplied it is passed through to XmlBufferToJson.
//	Note: phandler() and ehandler() calls are blocking, so reading and processing of messages is serialized.
//	      This means that you can stop reading the file on error or after processing a particular message.
//	      To have reading and handling run concurrently, pass arguments to a go routine in handler and return true.
//
// Errors from os.Stat, os.Open or reading the file are returned directly, without
// calling 'ehandler'. The function returns nil when the input is exhausted or when
// 'phandler' asks to stop.
func XmlMsgsFromFileAsJson(fname string, phandler func(string) bool, ehandler func(error) bool, recast ...bool) error {
	var r bool
	if len(recast) == 1 {
		r = recast[0]
	}
	fi, fierr := os.Stat(fname)
	if fierr != nil {
		return fierr
	}
	fh, fherr := os.Open(fname)
	if fherr != nil {
		return fherr
	}
	defer fh.Close()

	// A single Read call is allowed to return fewer bytes than requested, which
	// would leave the tail of buf zero-filled. io.ReadFull keeps reading until
	// buf is full or reports an error if the file ends early.
	buf := make([]byte, fi.Size())
	if _, rerr := io.ReadFull(fh, buf); rerr != nil {
		return rerr
	}

	// xml.Decoder doesn't properly handle whitespace in some doc
	// see songTextString.xml test case ...
	// The pattern is a constant, valid expression, so MustCompile cannot panic here.
	reg := regexp.MustCompile("[ \t\n\r]*<")
	b := bytes.NewBuffer(reg.ReplaceAll(buf, []byte("<")))

	for {
		s, serr := XmlBufferToJson(b, r)
		if serr != nil && serr != io.EOF {
			if ok := ehandler(serr); !ok {
				// caused reader termination
				return serr
			}
		}
		if s != "" {
			if ok := phandler(s); !ok {
				break
			}
		}
		// io.EOF marks the end of the buffered document; it is not reported as an error.
		if serr == io.EOF {
			break
		}
	}
	return nil
}

// XmlBufferToJson reads one XML message from a bytes.Buffer and returns it
// encoded as a JSON string.
//	'b' is the buffer
//	Optional argument 'recast' coerces values to float64 or bool where possible.
//	It is honored only when exactly one value is supplied.
//
// If the XML cannot be read, the empty string and the reader's error are returned.
// Otherwise the result of the map's Json() call is returned together with its error.
func XmlBufferToJson(b *bytes.Buffer, recast ...bool) (string, error) {
	coerce := len(recast) == 1 && recast[0]

	xmlMap, err := mxj.NewMapXmlReader(b, coerce)
	if err != nil {
		return "", err
	}

	encoded, err := xmlMap.Json()
	return string(encoded), err
}

// =============================  io.Reader version for stream processing  ======================

// XmlMsgsFromReaderAsJson is the io.Reader version of XmlMsgsFromFileAsJson: it
// repeatedly calls ToJson on 'rdr' and passes each non-empty JSON string to 'phandler'.
//	'rdr' is an io.Reader for an XML message (stream)
//	'phandler' is the JSON string processing handler. Return of 'false' stops further processing.
//	'ehandler' is the parsing error handler. Return of 'false' stops further processing and returns error.
//	'recast' is optional; it is forwarded to ToJson only when exactly one value is supplied.
//	Note: phandler() and ehandler() calls are blocking, so reading and processing of messages is serialized.
//	      This means that you can stop reading the stream on error or after processing a particular message.
//	      To have reading and handling run concurrently, pass arguments to a go routine in handler and return true.
//
// The function returns nil once ToJson reports io.EOF or 'phandler' returns false.
func XmlMsgsFromReaderAsJson(rdr io.Reader, phandler func(string) bool, ehandler func(error) bool, recast ...bool) error {
	coerce := len(recast) == 1 && recast[0]

	for {
		msg, err := ToJson(rdr, coerce)
		atEOF := err == io.EOF

		// Any error other than io.EOF goes to the error handler, which decides
		// whether reading continues.
		if err != nil && !atEOF && !ehandler(err) {
			return err
		}
		// Empty results are never forwarded to the processing handler.
		if msg != "" && !phandler(msg) {
			return nil
		}
		if atEOF {
			return nil
		}
	}
}