source: people/peter.buschman/backup_monitoring/parsing/parsers/nbstlutil/_nbstlutil.py@ 1102

Last change on this file since 1102 was 976, checked in by peter, on Dec 6, 2011 at 10:19:33 AM

Raw checkin of current NetBackup / TSM parsing code.

File size: 7.4 KB
Line 
1import re
2
3import time
4import datetime
5import pytz
6
7from ....builtins import *
8
9from ...exceptions import *
10from ...expressions import *
11from ...autotype import *
12from ...streams import *
13
14##
15## nbstlutil -U records begin with the string "Image:" on a line by itself
16##
17def stream(stream, format='nbstlutil list -U'):
18
19 if format in ['nbstlutil list -U']:
20 return LineSeparatorStream(stream, separator='Image:', header=1)
21 else:
22 raise ParseError, 'Unknown format %s' % (format)
23
24
25##
26## Parse a nbstlutil record
27##
28def parse(record, format='nbstlutil list -U', version=None, tz=None):
29
30 re_pair = re.compile('^\s*([^:]+):\s*(.*)\s*$')
31 re_type_id = re.compile('^([0-9a-zA-Z\-_ ]+)\s+\((\d+)\)$')
32 re_id_type = re.compile('^(\d+)\s+\(([0-9a-zA-Z\-_ ]+)\)$')
33 re_in_parens = re.compile('^\((.*)\)$')
34 re_starts_with_time = re.compile('^time_.*$')
35 re_ends_with_time = re.compile('^.*_time$')
36 re_time_plus_epoch_seconds_in_parens = re.compile('^.*\d:\d\d:\d\d.*\((\d+)\)$')
37 re_epoch_seconds_plus_time_in_parens = re.compile('^(\d+)\s+\(.*\d:\d\d:\d\d.*\)$')
38
39 image = ExtendedDict()
40
41 if format == 'nbstlutil list -U':
42
43 header = True
44
45 try:
46
47 i = 0
48
49 #
50 # process image header
51 #
52 while header and i < len(record):
53
54 line = record[i]
55
56 i += 1
57
58 #
59 # skip blank lines
60 #
61 if line == '':
62 continue
63
64 match = re_pair.match(line)
65
66 key = match.group(1)
67 value = match.group(2)
68 key = key.lower()
69 key = key.rstrip()
70 key = key.replace('-', '_')
71 key = key.replace(' ', '_')
72
73 if key == 'copy':
74 header = False
75 else:
76
77 #
78 # convert text values to python datatypes
79 #
80 while True:
81
82 #
83 # key name starts with time_ or ends with _time
84 #
85 if re_ends_with_time.match(key) or re_starts_with_time.match(key):
86
87 match = re_epoch_seconds_plus_time_in_parens.match(value)
88 if match:
89 value = datetime.datetime.fromtimestamp(float(match.group(1)), tz)
90 break
91
92 match = re_time_plus_epoch_seconds_in_parens.match(value)
93 if match:
94 value = datetime.datetime.fromtimestamp(float(match.group(1)), tz)
95 break
96
97 #
98 # separate id and type
99 #
100 match = re_id_type.match(value)
101 if match:
102 idkey = '%s_id' % (key)
103 value = match.group(2)
104 image[idkey] = int(match.group(1))
105 break
106
107 #
108 # strip enclosing parens
109 #
110 match = re_in_parens.match(value)
111 if match:
112 value = match.group(1)
113 break
114
115 #
116 # separate type and id
117 #
118 match = re_type_id.match(value)
119 if match:
120 idkey = '%s_id' % (key)
121 value = match.group(1)
122 image[idkey] = int(match.group(2))
123 break
124
125 #
126 # ..otherwise autodetect and break if no datatype conversion was possible
127 #
128 value = autotype(value)
129 break
130
131 #
132 # store value
133 #
134 image[key] = value
135
136 #
137 # parse image copies
138 #
139 copies = ExtendedDict()
140 fragment = False
141
142 while i < len(record):
143
144 line = record[i]
145
146 i += 1
147
148 #
149 # skip blank lines
150 #
151 if line == '':
152 continue
153
154 match = re_pair.match(line)
155
156 key = match.group(1)
157 value = match.group(2)
158 key = key.lower()
159 key = key.rstrip()
160 key = key.replace('-', '_')
161 key = key.replace(' ', '_')
162
163 if key == 'copy':
164 fragment = False
165
166 if key == 'fragment':
167 fragment = True
168#
169# #
170# # identify current copy
171# #
172# if key == 'copy_number':
173#
174# copy_number = int(value)
175#
176# if copy_number not in copies:
177# copies[copy_number] = ExtendedDict()
178# copies[copy_number]['copy_number'] = copy_number
179# copies[copy_number]['fragments'] = ExtendedDict()
180#
181# #
182# # identify current fragment
183# #
184# elif key == 'fragment':
185#
186# if value == 'TIR (-1)':
187# fragment = -1
188# elif value == 'TIR (-2)':
189# fragment = -2
190# else:
191# fragment = int(value)
192#
193# if fragment not in copies[copy_number].fragments:
194# copies[copy_number].fragments[fragment] = ExtendedDict()
195# copies[copy_number].fragments[fragment]['fragment'] = fragment
196#
197# #
198# # save the key and value using the copy and fragment
199# #
200# else:
201#
202# #
203# # match timestamp with Unix time in parentheses
204# #
205# match = re_nbu_datetime.match(line)
206# if match:
207# value = datetime.datetime.fromtimestamp(float(match.group(1)), tz)
208#
209# #
210# # separate type and id
211# #
212# elif re_type_id.match(value):
213# match = re_type_id.match(value)
214# idkey = '%s_id' % (key)
215# value = match.group(1)
216# copies[copy_number].fragments[fragment][idkey] = int(match.group(2))
217#
218# #
219# # ..otherwise autodetect
220# #
221# else:
222# value = autotype(value)
223#
224# copies[copy_number].fragments[fragment][key] = value
225#
226# image['copies'] = copies
227#
228
229 return image
230
231 except Exception, e:
232
233# for line in record:
234# print line
235
236 raise ParseError, e
237
238 else:
239
240 raise ParseError, 'Unknown format %s' % (format)
241
Note: See TracBrowser for help on using the repository browser.