-
Notifications
You must be signed in to change notification settings - Fork 1
/
table.py
428 lines (377 loc) · 20.1 KB
/
table.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
#!/usr/bin/env python
# -*- coding: utf-8 -*-
########################################################################
# DaleyKlippings
# Copyright (C) 2012-14 Clayton Daley III
# daleyklippings@gmail.com
#
# This program is free software; you can redistribute it and/or
# modify it under the terms of the GNU General Public License
# as published by the Free Software Foundation version 3.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
########################################################################
import logging
logger = logging.getLogger("daley_klippings.table")
logger.info("Loading DaleyKlippings Table Models")
"""
Table data model, proxy model, data edit delegates, parsing routine, default constants
"""
from settings import * # Includes re, PySide, pformat
import itertools
from datetime import datetime as dt
# Changed structure to list from dictionary to avoid problems with implementation of
# deleting rows function
class Clippings(list):
"""
Object to store all table data. Object structure:
- (headers)
- [
- {headers:
- {role:
- {item}}}]
"""
headers = HEADERS
def __init__(self):
list.__init__(self)
def import_csv(self, csv_reader):
detail = ''
try:
line = csv_reader.next()
except StopIteration:
return "CSV Import Failed\r\n\r\nNo data found.", \
'When loading first row, the CSV importer returned StopIteration, indicating that no data was ' + \
'available. However, the file seems to exist since we reached this point. Make sure you ' + \
'selected the correct file and that the file is in the correct format.'
headers = []
# We assume the top line is headers. Even if the headers aren't used, we need to know the identity of the
# column during import so we add them anyway.
for h in line:
logger.info("Adding %s to headers" % h)
headers.append(h)
# To ensure the table responds to all the right columns, we add the remaining headers. Our strategy later will
# set the value of these additional headers to None
missing_headers = 0
for h in self.headers:
if h not in headers:
missing_headers += 1
logger.info("Adding %s to headers" % h)
detail += '%s was not included in source data so it will be initialized with empty data.\r\n' % h
headers.append(h)
if missing_headers == len(self.headers):
return 'Error importing file. No valid headers found.', \
'The CSV Importer assumes that the first row is a list of headers. This tells DaleyKlippings ' + \
'how to map the CSV columns to data. When importing this first row, none of the columns matched ' + \
'the headers expected by DaleyKlippings. Please confirm that the headers are in English (not ' + \
'the translated versions) and use the same capitalization as the headers in the UI.'
# Now add the actual data, but don't rewind
for line in csv_reader:
logger.debug("Processing line %s" % pformat(line))
self.append(dict(itertools.izip_longest(headers, line)))
#self.append({(k, v) for k, v in dict(itertools.izip_longest(headers, line)) if k in self.headers})
logger.debug("... added")
logger.info("After import, object is %s" % pformat(self))
return 'CSV Import Completed', detail
def import_(self, my_clippings, import_settings):
"""
Parse My clippings.txt to fetch data
"""
detail = ''
delimiter = import_settings['Delimiter']
raw_clippings = my_clippings.split(delimiter)
if raw_clippings[-1].strip() == '':
raw_clippings.pop(-1)
try:
pattern = re.compile(import_settings['Pattern'], DEFAULT_RE_OPTIONS)
except Exception as error:
return u'The Import Pattern is invalid.', \
'Import Pattern resulted in the error:\n%s' % str(error.message)
date_format = import_settings['Date Format']
language_settings = import_settings['Application Settings']['Language']
date_language = language_settings['Date Language']
note_translation = language_settings['Note']
bookmark_translation = language_settings['Bookmark']
highlight_translation = language_settings['Highlight']
import_data = Clippings()
clipNo = 0
for raw_clipping in raw_clippings:
clipNo += 1
try:
clipping = pattern.search(raw_clipping.strip())
line = {}
emptyHeaders = 0
for h in self.headers:
try:
# Try to convert date to shorter format string, using standard datetime function
# as QDateTime support only local format strings.
# Date converted to QDateTime object for compatibility purpose.
if h == 'Date':
logger.debug("Original date is: '%s'" % clipping.group(h))
# Attempt to Localize Date
if date_language != 'English (default)':
logger.debug("... trying to localize date")
try:
local_language = QLocale(getattr(QLocale, date_language))
date = local_language.toDateTime(clipping.group(h), date_format).toPython()
logger.debug("... date converted to: '%s'" % str(date))
except Exception as e:
logger.exception("... error localizing date:\n%s" % e.message)
else:
# Attempt to Standardize Date
if u'%' in date_format:
# The % sign indicates that the pattern is a basic Python format
date = dt.strptime(clipping.group(h), date_format)
else:
# Otherwise, we assume a Qt Format
date = QDateTime.fromString(clipping.group(h), date_format).toPython()
line[h] = date
elif h == 'Note' and clipping.group('Type') == note_translation:
line[h] = clipping.group('Text')
elif h == 'Highlight' and clipping.group('Type') == highlight_translation:
line[h] = clipping.group('Text')
else:
line[h] = clipping.group(h)
except:
# If header is not found set it empty string
line[h] = ''
emptyHeaders += 1
if emptyHeaders == len(self.headers):
raise
import_data.append(line)
except Exception as e:
# Inform about invalid note
detail += u'\r\nWarning: note %d is empty or in wrong format: \r\n%s\r\n' % \
(clipNo, raw_clipping.strip())
logger.exception("Clipping number %s resulted in the exception: %s" % (clipNo, e.message))
continue
detail = u'<%s> %d out of %d clippings were successfully processed.\r\n%s' % (
QTime.currentTime().toString('hh:mm:ss'),
len(import_data),
clipNo,
detail)
# The original approach did this as lines were imported. Since Kindle now puts the note before the highlight,
# we need to post-process the data.
attachNotes = import_settings['Application Settings']['Attach Notes']['Attach Notes']
notesPosition = import_settings['Application Settings']['Attach Notes']['Notes Position']
range_indicator = language_settings['Range Separator']
matched = 0
if attachNotes == 'True':
skip = False # This makes it easy to skip subsequent rows
for row in range(len(import_data)):
# Once we match two lines, we don't want to process the second line again. This is especially
# problematic in Automatic mode since we could match both forward and backwards.
if skip:
skip = False
continue
# If the current row is a note, we want to check and see if the next row is a matching highlight
if import_data[row][u'Type'] in [note_translation, 'Note']:
# We've found a notes row
# Automatic prefers notes before highlights so we start there
# If the before match fails (or if the user chooses "After highlights"), we try the after match
if (
# We're looking for notes before highlights
# and there is a next row to analyze
# and the next row is a highlight
# and the name of the books match
# and either there is no location on the highlight or the note location falls in the highlight range
# and either there is no page or the highlight or the note page falls in the highlight range
notesPosition == 'Before highlights' or notesPosition == 'Automatic (default)') and \
row < len(import_data) - 1 and \
import_data[row + 1][u'Type'] == highlight_translation and \
import_data[row][u'Book'] == import_data[row + 1][u'Book'] and \
any(
(
int(u'-1') if import_data[row][u'Location'] is None else
int(import_data[row][u'Location'])) == s for s in (
[int(u'-1')] if import_data[row + 1][u'Location'] is None
else self.hyphen_range(import_data[row + 1][u'Location'],
range_indicator=range_indicator))
) and any(
(
int(u'-1') if import_data[row][u'Page'] is None else
int(import_data[row][u'Page']))== s for s in (
[int(u'-1')] if import_data[row + 1][u'Page'] is None \
else self.hyphen_range(import_data[row + 1][u'Page'],
range_indicator=range_indicator))
):
import_data[row][u'Highlight'] = import_data[row + 1][u'Highlight']
import_data[row][u'Location'] = import_data[row + 1][u'Location']
self.append(import_data[row])
matched += 1
skip = True
elif (
# We're looking for notes after highlights
# and there is a previous row to analyze
# and the previous row is a highlight
# and the name of the books match
# and either there is no location on the highlight or the note location falls in the highlight range
# and either there is no page or the highlight or the note page falls in the highlight range
notesPosition == 'After highlights'
or notesPosition == 'Automatic (default)') and \
row > 0 and \
import_data[row - 1][u'Type'] == highlight_translation and \
import_data[row][u'Book'] == \
import_data[row - 1][u'Book'] and \
any(
(
int(u'-1') if import_data[row][u'Location'] is None else
int(import_data[row][u'Location'])) == s for s in (
[int(u'-1')] if import_data[row - 1][u'Location'] is None else
self.hyphen_range(import_data[row - 1][u'Location'],
range_indicator=range_indicator))
) and any(
(
int(u'-1') if import_data[row][u'Page'] is None else
int(import_data[row][u'Page'])) == s for s in (
[int(u'-1')] if import_data[row - 1][u'Page'] is None else
self.hyphen_range(import_data[row - 1][u'Page'],
range_indicator=range_indicator))
):
# In case the auto matcher already matched and skipped the previous highlight
if self[len(self) - 1][u'Type'] == highlight_translation:
# If not, edit the highlight's entry in tableData
self[len(self) - 1][u'Note'] = import_data[row][u'Note']
self[len(self) - 1][u'Type'] = import_data[row][u'Type']
else:
# If so, attach the highlight to the new note as well
import_data[row][u'Highlight'] = import_data[row - 1][u'Highlight']
self.append(import_data[row])
matched += 1
else:
self.append(import_data[row])
else:
self.append(import_data[row])
else: # if attach notes flag is not on
for row in import_data:
self.append(row)
# Pop Import Status Box
summary = u'%d out of %d clippings were successfully processed%s' % (len(import_data), clipNo, u' ' * 50)
if len(import_data) == 0 and clipNo > 0:
summary += u'Please verify that you selected the right file or try a different Import Pattern.' + u' ' * 50 + \
u'\r\n\r\nIf none of the built-in patterns work, please contact daleyklippings@claytondaley.com.' + u' ' * 50
else:
if attachNotes == 'True':
summary += u'\r\n - We were able to match %d Note%s with a Highlight %s' % \
(matched, ('s' if matched > 1 else ''), u' ' * 50)
if matched > 0:
summary += u'\r\n - As a result, fewer lines will show up in the interface.' + u' ' * 50
return summary, detail
def hyphen_range(self, s, range_indicator='-'):
""" Takes a range in form of "a-b" and generate a list of numbers between a and b inclusive.
Also accepts comma separated ranges like "a-b,c-d,f" will build a list which will include
Numbers from a to b, a to d and f """
if s is None:
return []
s = u''.join(s.split()) #removes white space
r = set()
for x in s.split(','):
t = x.split(range_indicator)
if len(t) not in [1, 2]: raise SyntaxError(
"hash_range is given its argument as %s which seems not correctly formatted." % s)
# To support ranges like 2014-52 which really mean 2014-2052
if len(t) == 2 and len(t[0]) > len(t[1]):
t[1] = t[0][:(len(t[0]) - len(t[1]))] + t[1]
r.add(int(t[0])) if len(t) == 1 else r.update(set(range(int(t[0]), int(t[1]) + 1)))
l = list(r)
l.sort()
return l
class TableModel(QAbstractTableModel):
"""
Table model, all the data are stored in the Clippings object tableData.
Returns status string.
"""
table_data = Clippings()
def __init__(self, parent=None):
QAbstractTableModel.__init__(self, parent)
self.table_data = Clippings()
def parse(self, my_clippings, import_settings, append=True):
"""
Parse data in my_clippings using pattern in import_settings
"""
self.beginResetModel()
# Clear previous data
if not append:
self.reset()
# Consider loading default import_settings if import_settings is None
if import_settings is None:
raise ValueError("Import Pattern not selected.")
summary, detail = self.table_data.import_(my_clippings=my_clippings, import_settings=import_settings)
self.endResetModel()
return summary, detail
def from_csv(self, csv_reader, append=True):
"""
Update
"""
self.beginResetModel()
# Clear previous data
if not append:
self.reset()
summary, detail = self.table_data.import_csv(csv_reader=csv_reader)
self.endResetModel()
return summary, detail
def reset(self):
self.table_data = Clippings()
def rowCount(self, index):
return len(self.table_data)
def columnCount(self, index):
return len(self.table_data.headers)
def data(self, index, role):
row = index.row()
column = index.column()
if role == Qt.DisplayRole or role == Qt.EditRole:
return self.table_data[row][self.table_data.headers[column]]
def headerData(self, section, orientation, role):
if orientation == Qt.Horizontal:
if role == Qt.DisplayRole:
return self.table_data.headers[section]
if orientation == Qt.Vertical:
if role == Qt.DisplayRole:
return section + 1
def setData(self, index, value, role):
if role == Qt.EditRole:
self.table_data[index.row()][self.table_data.headers[index.column()]] = value
"""
if self.table_data.headers[index.column()] == 'Date':
# This is necessary because Qt uses a QVariant to get around typing issues
self.table_data[index.row()][self.table_data.headers[index.column()]] = value.toPython()
else:
# This is necessary because Qt uses a QVariant to get around typing issues
self.table_data[index.row()][self.table_data.headers[index.column()]] = value
"""
self.emit(SIGNAL('dataChanged(QModelIndex, QModelIndex)'), index, index)
return True
def removeRows(self, row, count, parent):
self.beginRemoveRows(parent, row, row + count - 1)
del self.table_data[row]
self.endRemoveRows()
return True
def flags(self, index):
return Qt.ItemIsSelectable | \
Qt.ItemIsEditable | \
Qt.ItemIsEnabled | \
Qt.ItemIsDragEnabled
def mimeTypes(self):
types = ['application/vnd.text.list', ]
return types
def mimeData(self, indexes):
mimeData = QMimeData()
text = ''
# Sort indexes, because sometimes they are given in wrong order
indexes.sort()
for i in range(0, len(indexes), len(self.table_data.headers)):
if indexes[i].column() == 0:
text += '%s\r\n- %s Loc. %s | Added on %s\r\n\r\n%s\r\n==========\r\n' % \
(self.data(indexes[i], Qt.DisplayRole),
self.data(indexes[i + 1], Qt.DisplayRole),
self.data(indexes[i + 2], Qt.DisplayRole),
self.data(indexes[i + 3], Qt.EditRole).toString('dddd, MMMM dd, yyyy, hh:mm AP'),
self.data(indexes[i + 4], Qt.DisplayRole))
mimeData.setText(text)
return mimeData