-
Notifications
You must be signed in to change notification settings - Fork 43
/
crawl_result_x_object.go
61 lines (50 loc) · 1.13 KB
/
crawl_result_x_object.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
package pdft
import (
"bytes"
"fmt"
"regexp"
"strconv"
"strings"
)
// crawlResultXObjects is a list of crawlResultXObject entries. Its parse
// method appends entries to the list and its String method serializes them.
type crawlResultXObjects []crawlResultXObject
// regSplit breaks a property key into two capture groups: group 1 is a run of
// ASCII letters and spaces, group 2 is the run of decimal digits that
// immediately follows it (for example "Im12" gives "Im" and "12").
//
// The pattern is unanchored and both groups may be empty, so it matches every
// input; a key that does not start with a letter, space or digit produces an
// empty match with two empty groups.
var regSplit = regexp.MustCompile(`([a-z A-Z]*)([0-9]*)`)
// parse reads the property entries encoded in propVal with readProperties and
// appends one crawlResultXObject to *c for each of them.
//
// Every property key is split by regSplit into a letter prefix and a numeric
// suffix (for example "Im1" gives "Im" and 1). The object ID is the first
// value returned by readObjIDFromDictionary for the entry's raw value; the
// second returned value is discarded.
//
// parse stops at the first failure and returns the underlying error wrapped
// with the operation and the offending key. Entries appended before the
// failure remain in *c.
func (c *crawlResultXObjects) parse(propVal *[]byte) error {
	var props PDFObjPropertiesData
	if err := readProperties(propVal, &props); err != nil {
		return fmt.Errorf("reading xobject properties: %w", err)
	}

	for _, prop := range props {
		tokens := regSplit.FindStringSubmatch(prop.key)
		// Purely defensive: regSplit can match the empty string, so a
		// successful match with all three elements is expected for any key.
		if len(tokens) < 3 {
			continue
		}

		// A key whose letter prefix is not followed by digits leaves
		// tokens[2] empty; Atoi rejects it and the key is named in the error.
		index, err := strconv.Atoi(strings.TrimSpace(tokens[2]))
		if err != nil {
			return fmt.Errorf("parsing index of xobject key %q: %w", prop.key, err)
		}

		objID, _, err := readObjIDFromDictionary(prop.rawVal)
		if err != nil {
			return fmt.Errorf("reading object ID of xobject %q: %w", prop.key, err)
		}

		*c = append(*c, crawlResultXObject{
			xObjChar:  tokens[1],
			xObjIndex: index,
			xObjObjID: objID,
		})
	}
	return nil
}
// String serializes the list by formatting every entry as
// "/<xObjChar><xObjIndex> <xObjObjID> 0 R" and concatenating the results with
// no separator between entries. The shape looks like a PDF name followed by an
// indirect object reference with generation 0.
//
// A nil receiver or an empty list yields the empty string.
func (c *crawlResultXObjects) String() string {
	if c == nil {
		return ""
	}

	var buff bytes.Buffer
	for _, xObj := range *c {
		// Format directly into the buffer instead of building a temporary
		// string with Sprintf first.
		fmt.Fprintf(&buff, "/%s%d %d 0 R", xObj.xObjChar, xObj.xObjIndex, xObj.xObjObjID)
	}
	return buff.String()
}
// crawlResultXObject is a single entry of crawlResultXObjects. The parse
// method fills it from one property: the key is split into a letter prefix and
// a numeric suffix, and the raw value supplies the object ID.
type crawlResultXObject struct {
// xObjChar is the letter (and space) prefix of the property key, i.e. the
// first capture group of regSplit.
xObjChar string
// xObjIndex is the numeric suffix of the property key, i.e. the second
// capture group of regSplit converted with strconv.Atoi.
xObjIndex int
// xObjObjID is the first value returned by readObjIDFromDictionary for the
// property's raw value; presumably the ID of the referenced PDF object
// (String prints it as "<id> 0 R") - confirm against that helper.
xObjObjID int
}