-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmetagopenoffice.go
101 lines (92 loc) · 3.05 KB
/
metagopenoffice.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
/*
Licensed to the Apache Software Foundation (ASF) under one
or more contributor license agreements. See the NOTICE file
distributed with this work for additional information
regarding copyright ownership. The ASF licenses this file
to you under the Apache License, Version 2.0 (the
"License"); you may not use this file except in compliance
with the License. You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing,
software distributed under the License is distributed on an
"AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
KIND, either express or implied. See the License for the
specific language governing permissions and limitations
under the License.
*/
package metagopenoffice
import (
"archive/zip"
"bufio"
"encoding/xml"
"errors"
"os"
"strings"
)
//Statistics is a struct that contains the document-statistics
type Statistics struct {
PageCount int `xml:"page-count,attr"`
ImageCount int `xml:"image-count,attr"`
ObjectCount int `xml:"object-count,attr"`
ParagraphCount int `xml:"paragraph-count,attr"`
WordCount int `xml:"word-count,attr"`
CharCount int `xml:"character-count,attr"`
}
//Metadata is a struct that contains metadata fields
type Metadata struct {
Generator string `xml:"generator"`
Title string `xml:"title"`
Description string `xml:"description"`
Subject string `xml:"subject"`
PrintDate string `xml:"print-date"`
Keyword string `xml:"keyword"`
InitialCreator string `xml:"initial-creator"`
CreationDate string `xml:"creation-date"`
Creator string `xml:"creator"`
Date string `xml:"date"`
Language string `xml:"language"`
EditingCycles string `xml:"editing-cycles"`
EditingDuration string `xml:"editing-duration"`
Stats Statistics `xml:"document-statistic"`
}
//OpenOfficeXML contains the fields of te file meta.xml
type OpenOfficeXML struct {
Meta Metadata `xml:"meta"`
}
//GetMetada function
func GetMetada(document *os.File) (metadata OpenOfficeXML, err error) {
fileName := document.Name()
dot := strings.LastIndex(fileName, ".")
after := fileName[:dot] + ".zip"
err = os.Rename(fileName, after)
if err != nil {
return metadata, errors.New("Failed to rename as .zip")
}
read, err := zip.OpenReader(after)
if err != nil {
os.Rename(after, fileName)
return metadata, errors.New("Failed to open the file")
}
var xmlFile string
for _, file := range read.File {
if file.Name == "meta.xml" {
rc, err := file.Open()
scanner := bufio.NewScanner(rc)
for scanner.Scan() {
xmlFile += scanner.Text()
}
if err != nil {
os.Rename(after, fileName)
return metadata, errors.New("Failed to open meta.xml")
}
defer rc.Close()
}
}
if err := xml.Unmarshal([]byte(xmlFile), &metadata); err != nil {
os.Rename(after, fileName)
return metadata, errors.New("Failed to Unmarshal")
}
read.Close()
os.Rename(after, fileName)
return metadata, err
}