Merge lp:~realender/calibre/calibre into lp:~user-none/calibre/store

Proposed by Alex Stanev
Status: Merged
Merged at revision: 8446
Proposed branch: lp:~realender/calibre/calibre
Merge into: lp:~user-none/calibre/store
Diff against target: 1189 lines (+803/-91)
14 files modified
recipes/idg_se.recipe (+33/-0)
recipes/united_daily.recipe (+1/-1)
recipes/utrinski.recipe (+71/-0)
src/calibre/customize/builtins.py (+11/-0)
src/calibre/devices/android/driver.py (+5/-3)
src/calibre/devices/eb600/driver.py (+3/-3)
src/calibre/ebooks/mobi/debug.py (+293/-8)
src/calibre/ebooks/mobi/tbs_periodicals.rst (+189/-0)
src/calibre/ebooks/mobi/utils.py (+5/-3)
src/calibre/gui2/store/stores/chitanka_plugin.py (+16/-46)
src/calibre/gui2/store/stores/eknigi_plugin.py (+88/-0)
src/calibre/translations/msgfmt.py (+83/-24)
src/calibre/utils/localization.py (+3/-3)
src/calibre/web/feeds/recipes/model.py (+2/-0)
To merge this branch: bzr merge lp:~realender/calibre/calibre
Reviewer: John Schember (review status: Pending)
Review via email: mp+68588@code.launchpad.net
lp:~realender/calibre/calibre updated
9904. By Alex Stanev

Remove affiliate id for now

9905. By Alex Stanev

Use Kovid's affiliate id 30% of the time

9906. By Alex Stanev

sync to trunc

Preview Diff

=== added file 'recipes/idg_se.recipe'
--- recipes/idg_se.recipe 1970-01-01 00:00:00 +0000
+++ recipes/idg_se.recipe 2011-07-22 18:03:36 +0000
@@ -0,0 +1,33 @@
+__license__ = 'GPLv3'
+
+from calibre.web.feeds.news import BasicNewsRecipe
+
+class IDGse(BasicNewsRecipe):
+    title = 'IDG'
+    description = 'IDG.se'
+    language = 'se'
+    __author__ = 'zapt0'
+    oldest_article = 1
+    max_articles_per_feed = 40
+    no_stylesheets = True
+    encoding = 'ISO-8859-1'
+    remove_javascript = True
+
+    feeds = [(u'Senaste nytt',u'http://feeds.idg.se/idg/vzzs')]
+
+    def print_version(self,url):
+        return url + '?articleRenderMode=print&m=print'
+
+    def get_cover_url(this):
+        return 'http://idgmedia.idg.se/polopoly_fs/2.3275!images/idgmedia_logo_75.jpg'
+
+    keep_only_tags = [
+        dict(name='h1'),
+        dict(name='div', attrs={'class':['divColumn1Article']}),
+    ]
+    #remove ads
+    remove_tags = [
+        dict(name='div', attrs={'id':['preamble_ad']}),
+        dict(name='ul', attrs={'class':['share']})
+    ]
+
=== modified file 'recipes/united_daily.recipe'
--- recipes/united_daily.recipe 2011-05-17 15:30:51 +0000
+++ recipes/united_daily.recipe 2011-07-22 18:03:36 +0000
@@ -64,7 +64,7 @@
 
     __author__ = 'Eddie Lau'
     __version__ = '1.1'
-    language = 'zh-TW'
+    language = 'zh_TW'
     publisher = 'United Daily News Group'
     description = 'United Daily (Taiwan)'
     category = 'News, Chinese, Taiwan'
 
=== added file 'recipes/utrinski.recipe'
--- recipes/utrinski.recipe 1970-01-01 00:00:00 +0000
+++ recipes/utrinski.recipe 2011-07-22 18:03:36 +0000
@@ -0,0 +1,71 @@
+#!/usr/bin/env python
+
+__license__ = 'GPL v3'
+__copyright__ = '2011, Darko Spasovski <darko.spasovski at gmail.com>'
+'''
+utrinski.com.mk
+'''
+
+import re
+import datetime
+from calibre.web.feeds.news import BasicNewsRecipe
+
+class UtrinskiVesnik(BasicNewsRecipe):
+
+    __author__ = 'Darko Spasovski'
+    INDEX = 'http://www.utrinski.com.mk/'
+    title = 'Utrinski Vesnik'
+    description = 'Daily Macedonian newspaper'
+    masthead_url = 'http://www.utrinski.com.mk/images/LogoTop.jpg'
+    language = 'mk'
+    remove_javascript = True
+    publication_type = 'newspaper'
+    category = 'news, Macedonia'
+    oldest_article = 2
+    max_articles_per_feed = 100
+    no_stylesheets = True
+    use_embedded_content = False
+    preprocess_regexps = [(re.compile(i[0], re.IGNORECASE | re.DOTALL), i[1]) for i in
+        [
+            ## Remove anything before the start of the article.
+            (r'<body.*?Article start-->', lambda match: '<body>'),
+
+            ## Remove anything after the end of the article.
+            (r'<!--Article end.*?</body>', lambda match : '</body>'),
+        ]
+    ]
+    extra_css = """
+        body{font-family: Arial,Helvetica,sans-serif}
+        .WB_UTRINSKIVESNIK_Naslov{FONT-WEIGHT: bold; FONT-SIZE: 18px; FONT-FAMILY: Arial, Verdana, Tahoma; TEXT-DECORATION: none}
+    """
+
+    conversion_options = {
+        'comment' : description,
+        'tags' : category,
+        'language' : language,
+        'linearize_tables' : True
+    }
+
+    def parse_index(self):
+        soup = self.index_to_soup(self.INDEX)
+        feeds = []
+        for section in soup.findAll('a', attrs={'class':'WB_UTRINSKIVESNIK_TOCTitleBig'}):
+            sectionTitle = section.contents[0].string
+            tocItemTable = section.findAllPrevious('table')[1]
+            if tocItemTable is None: continue
+            articles = []
+            while True:
+                tocItemTable = tocItemTable.nextSibling
+                if tocItemTable is None: break
+                article = tocItemTable.findAll('a', attrs={'class': 'WB_UTRINSKIVESNIK_TocItem'})
+                if len(article)==0: break
+                title = self.tag_to_string(article[0], use_alt=True).strip()
+                articles.append({'title': title, 'url':'http://www.utrinski.com.mk/' + article[0]['href'], 'description':'', 'date':''})
+            if articles:
+                feeds.append((sectionTitle, articles))
+        return feeds
+
+
+    def get_cover_url(self):
+        datum = datetime.datetime.today().strftime('%d_%m_%Y')
+        return 'http://www.utrinski.com.mk/WBStorage/Files/' + datum + '.jpg'
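
get_cover_url() builds the cover location from today's date in '%d_%m_%Y' form; a quick illustration of the URL the recipe would request (the date below is only an example)::

    import datetime
    datum = datetime.date(2011, 7, 22).strftime('%d_%m_%Y')
    print('http://www.utrinski.com.mk/WBStorage/Files/' + datum + '.jpg')
    # http://www.utrinski.com.mk/WBStorage/Files/22_07_2011.jpg
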
=== modified file 'src/calibre/customize/builtins.py'
--- src/calibre/customize/builtins.py 2011-07-19 22:48:25 +0000
+++ src/calibre/customize/builtins.py 2011-07-22 18:03:36 +0000
@@ -1258,6 +1258,16 @@
     formats = ['EPUB', 'PDF']
     affiliate = True
 
+class StoreEKnigiStore(StoreBase):
+    name = u'еКниги'
+    author = 'Alex Stanev'
+    description = u'Онлайн книжарница за електронни книги и аудио риалити романи'
+    actual_plugin = 'calibre.gui2.store.stores.eknigi_plugin:eKnigiStore'
+
+    headquarters = 'BG'
+    formats = ['EPUB', 'PDF', 'HTML']
+    #affiliate = True
+
 class StoreEpubBudStore(StoreBase):
     name = 'ePub Bud'
     description = 'Well, it\'s pretty much just "YouTube for Children\'s eBooks. A not-for-profit organization devoted to brining self published childrens books to the world.'
@@ -1483,6 +1493,7 @@
     StoreEBookShoppeUKStore,
 #   StoreEPubBuyDEStore,
     StoreEHarlequinStore,
+    StoreEKnigiStore,
     StoreEpubBudStore,
     StoreFeedbooksStore,
     StoreFoylesUKStore,
 
=== modified file 'src/calibre/devices/android/driver.py'
--- src/calibre/devices/android/driver.py 2011-07-16 16:01:32 +0000
+++ src/calibre/devices/android/driver.py 2011-07-22 18:03:36 +0000
@@ -47,10 +47,12 @@
 
             # Google
             0x18d1 : {
+                0x0001 : [0x0223],
                 0x4e11 : [0x0100, 0x226, 0x227],
-                0x4e12: [0x0100, 0x226, 0x227],
-                0x4e21: [0x0100, 0x226, 0x227],
-                0xb058: [0x0222, 0x226, 0x227]},
+                0x4e12 : [0x0100, 0x226, 0x227],
+                0x4e21 : [0x0100, 0x226, 0x227],
+                0xb058 : [0x0222, 0x226, 0x227]
+                },
 
             # Samsung
             0x04e8 : { 0x681d : [0x0222, 0x0223, 0x0224, 0x0400],
 
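
The table touched here maps a USB vendor id to its product ids and, for each product, the list of accepted BCD revisions; the new 0x0001 : [0x0223] entry adds another Google device. A minimal sketch of how such a nested table can be consulted (the helper and the table excerpt are illustrative, not the driver's actual matching code)::

    GOOGLE = 0x18d1
    TABLE = {GOOGLE: {0x0001: [0x0223], 0x4e11: [0x0100, 0x226, 0x227]}}

    def accepts(table, vid, pid, bcd):
        # a device matches when its BCD is listed under its vendor/product pair
        return bcd in table.get(vid, {}).get(pid, [])

    print(accepts(TABLE, GOOGLE, 0x0001, 0x0223))  # True
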
=== modified file 'src/calibre/devices/eb600/driver.py'
--- src/calibre/devices/eb600/driver.py 2011-06-07 00:26:05 +0000
+++ src/calibre/devices/eb600/driver.py 2011-07-22 18:03:36 +0000
@@ -35,9 +35,9 @@
     PRODUCT_ID = [0x1688]
     BCD = [0x110]
 
-    VENDOR_NAME = ['NETRONIX', 'WOLDER']
-    WINDOWS_MAIN_MEM = ['EBOOK', 'MIBUK_GAMMA_6.2']
-    WINDOWS_CARD_A_MEM = 'EBOOK'
+    VENDOR_NAME = ['NETRONIX', 'WOLDER', 'MD86371']
+    WINDOWS_MAIN_MEM = ['EBOOK', 'MIBUK_GAMMA_6.2', 'MD86371']
+    WINDOWS_CARD_A_MEM = ['EBOOK', 'MD86371']
 
     OSX_MAIN_MEM = 'EB600 Internal Storage Media'
     OSX_CARD_A_MEM = 'EB600 Card Storage Media'
 
=== modified file 'src/calibre/ebooks/mobi/debug.py'
--- src/calibre/ebooks/mobi/debug.py 2011-07-20 20:01:41 +0000
+++ src/calibre/ebooks/mobi/debug.py 2011-07-22 18:03:36 +0000
@@ -8,7 +8,7 @@
8__docformat__ = 'restructuredtext en'8__docformat__ = 'restructuredtext en'
99
10import struct, datetime, sys, os, shutil10import struct, datetime, sys, os, shutil
11from collections import OrderedDict11from collections import OrderedDict, defaultdict
12from calibre.utils.date import utc_tz12from calibre.utils.date import utc_tz
13from calibre.ebooks.mobi.langcodes import main_language, sub_language13from calibre.ebooks.mobi.langcodes import main_language, sub_language
14from calibre.ebooks.mobi.utils import (decode_hex_number, decint,14from calibre.ebooks.mobi.utils import (decode_hex_number, decint,
@@ -530,21 +530,21 @@
530 },530 },
531531
532 'chapter_with_subchapters' : {532 'chapter_with_subchapters' : {
533 22 : ('First subchapter index', 'first_subchapter_index'),533 22 : ('First subchapter index', 'first_child_index'),
534 23 : ('Last subchapter index', 'last_subchapter_index'),534 23 : ('Last subchapter index', 'last_child_index'),
535 },535 },
536536
537 'periodical' : {537 'periodical' : {
538 5 : ('Class offset in cncx', 'class_offset'),538 5 : ('Class offset in cncx', 'class_offset'),
539 22 : ('First section index', 'first_section_index'),539 22 : ('First section index', 'first_child_index'),
540 23 : ('Last section index', 'last_section_index'),540 23 : ('Last section index', 'last_child_index'),
541 },541 },
542542
543 'section' : {543 'section' : {
544 5 : ('Class offset in cncx', 'class_offset'),544 5 : ('Class offset in cncx', 'class_offset'),
545 21 : ('Periodical index', 'periodical_index'),545 21 : ('Periodical index', 'parent_index'),
546 22 : ('First article index', 'first_article_index'),546 22 : ('First article index', 'first_child_index'),
547 23 : ('Last article index', 'last_article_index'),547 23 : ('Last article index', 'last_child_index'),
548 },548 },
549 }549 }
550550
@@ -625,11 +625,56 @@
625 return tag.cncx_value625 return tag.cncx_value
626 return ''626 return ''
627627
628 @property
629 def offset(self):
630 for tag in self.tags:
631 if tag.attr == 'offset':
632 return tag.value
633 return 0
634
635 @property
636 def size(self):
637 for tag in self.tags:
638 if tag.attr == 'size':
639 return tag.value
640 return 0
641
642 @property
643 def depth(self):
644 for tag in self.tags:
645 if tag.attr == 'depth':
646 return tag.value
647 return 0
648
649 @property
650 def parent_index(self):
651 for tag in self.tags:
652 if tag.attr == 'parent_index':
653 return tag.value
654 return -1
655
656 @property
657 def first_child_index(self):
658 for tag in self.tags:
659 if tag.attr == 'first_child_index':
660 return tag.value
661 return -1
662
663 @property
664 def last_child_index(self):
665 for tag in self.tags:
666 if tag.attr == 'last_child_index':
667 return tag.value
668 return -1
669
628 def __str__(self):670 def __str__(self):
629 ans = ['Index Entry(index=%s, entry_type=%s, length=%d)'%(671 ans = ['Index Entry(index=%s, entry_type=%s, length=%d)'%(
630 self.index, self.entry_type, len(self.tags))]672 self.index, self.entry_type, len(self.tags))]
631 for tag in self.tags:673 for tag in self.tags:
632 ans.append('\t'+str(tag))674 ans.append('\t'+str(tag))
675 if self.first_child_index != -1:
676 ans.append('\tNumber of children: %d'%(self.last_child_index -
677 self.first_child_index + 1))
633 return '\n'.join(ans)678 return '\n'.join(ans)
634679
635# }}}680# }}}
@@ -679,6 +724,15 @@
679 entry_type = ord(indxt[off+consumed])724 entry_type = ord(indxt[off+consumed])
680 self.indices.append(IndexEntry(index, entry_type,725 self.indices.append(IndexEntry(index, entry_type,
681 indxt[off+consumed+1:next_off], cncx, index_header.tagx_entries))726 indxt[off+consumed+1:next_off], cncx, index_header.tagx_entries))
727 index = self.indices[-1]
728
729 def get_parent(self, index):
730 if index.depth < 1:
731 return None
732 parent_depth = index.depth - 1
733 for p in self.indices:
734 if p.depth != parent_depth:
735 continue
682736
683737
684 def __str__(self):738 def __str__(self):
@@ -793,6 +847,231 @@
793847
794# }}}848# }}}
795849
850class TBSIndexing(object): # {{{
851
852 def __init__(self, text_records, indices, doc_type):
853 self.record_indices = OrderedDict()
854 self.doc_type = doc_type
855 self.indices = indices
856 pos = 0
857 for r in text_records:
858 start = pos
859 pos += len(r.raw)
860 end = pos - 1
861 self.record_indices[r] = x = {'starts':[], 'ends':[],
862 'complete':[], 'geom': (start, end)}
863 for entry in indices:
864 istart, sz = entry.offset, entry.size
865 iend = istart + sz - 1
866 has_start = istart >= start and istart <= end
867 has_end = iend >= start and iend <= end
868 rec = None
869 if has_start and has_end:
870 rec = 'complete'
871 elif has_start and not has_end:
872 rec = 'starts'
873 elif not has_start and has_end:
874 rec = 'ends'
875 if rec:
876 x[rec].append(entry)
877
878 def get_index(self, idx):
879 for i in self.indices:
880 if i.index == idx: return i
881 raise IndexError('Index %d not found'%idx)
882
883 def __str__(self):
884 ans = ['*'*20 + ' TBS Indexing (%d records) '%len(self.record_indices)+ '*'*20]
885 for r, dat in self.record_indices.iteritems():
886 ans += self.dump_record(r, dat)[-1]
887 return '\n'.join(ans)
888
889 def dump(self, bdir):
890 types = defaultdict(list)
891 for r, dat in self.record_indices.iteritems():
892 tbs_type, strings = self.dump_record(r, dat)
893 if tbs_type == 0: continue
894 types[tbs_type] += strings
895 for typ, strings in types.iteritems():
896 with open(os.path.join(bdir, 'tbs_type_%d.txt'%typ), 'wb') as f:
897 f.write('\n'.join(strings))
898
899 def dump_record(self, r, dat):
900 ans = []
901 ans.append('\nRecord #%d: Starts at: %d Ends at: %d'%(r.idx,
902 dat['geom'][0], dat['geom'][1]))
903 s, e, c = dat['starts'], dat['ends'], dat['complete']
904 ans.append(('\tContains: %d index entries '
905 '(%d ends, %d complete, %d starts)')%tuple(map(len, (s+e+c, e,
906 c, s))))
907 byts = bytearray(r.trailing_data.get('indexing', b''))
908 sbyts = tuple(hex(b)[2:] for b in byts)
909 ans.append('TBS bytes: %s'%(' '.join(sbyts)))
910 for typ, entries in (('Ends', e), ('Complete', c), ('Starts', s)):
911 if entries:
912 ans.append('\t%s:'%typ)
913 for x in entries:
914 ans.append(('\t\tIndex Entry: %d (Parent index: %d, '
915 'Depth: %d, Offset: %d, Size: %d) [%s]')%(
916 x.index, x.parent_index, x.depth, x.offset, x.size, x.label))
917 def bin3(num):
918 ans = bin(num)[2:]
919 return '0'*(3-len(ans)) + ans
920
921 tbs_type = 0
922 if len(byts):
923 outer, consumed = decint(byts)
924 byts = byts[consumed:]
925 tbs_type = outer & 0b111
926 ans.append('TBS Type: %s (%d)'%(bin3(tbs_type), tbs_type))
927 ans.append('Outer Index entry: %d'%(outer >> 3))
928 arg1, consumed = decint(byts)
929 byts = byts[consumed:]
930 ans.append('Unknown (vwi: always 0?): %d'%arg1)
931 if self.doc_type in (257, 259): # Hierarchical periodical
932 byts, a = self.interpret_periodical(tbs_type, byts)
933 ans += a
934 if byts:
935 sbyts = tuple(hex(b)[2:] for b in byts)
936 ans.append('Remaining bytes: %s'%' '.join(sbyts))
937
938 ans.append('')
939 return tbs_type, ans
940
941 def interpret_periodical(self, tbs_type, byts):
942 ans = []
943
944 def tbs_type_6(byts, psi=None, msg=None): # {{{
945 if psi is None:
946 # Assume parent section is 1
947 psi = self.get_index(1)
948 if msg is None:
949 msg = ('Article index at start of record or first article'
950 ' index, relative to parent section')
951 if byts:
952 # byts could be empty
953 arg, consumed = decint(byts)
954 byts = byts[consumed:]
955 flags = (arg & 0b1111)
956 ai = (arg >> 4)
957 ans.append('%s (fvwi): %d [%d absolute]'%(msg, ai,
958 ai+psi.index))
959 if flags == 1:
960 arg, consumed = decint(byts)
961 byts = byts[consumed:]
962 ans.append('EOF (vwi: should be 0): %d'%arg)
963 elif flags in (4, 5):
964 num = byts[0]
965 byts = byts[1:]
966 ans.append('Number of article nodes in the record (byte): %d'%num)
967 if flags == 5:
968 arg, consumed = decint(byts)
969 byts = byts[consumed:]
970 ans.append('Unknown ??? (vwi)): %d'%(arg))
971 elif flags == 0:
972 pass
973 else:
974 raise ValueError('Unknown flags: %d'%flags)
975 return byts
976
977 # }}}
978
979 if tbs_type == 3: # {{{
980 arg2, consumed = decint(byts)
981 byts = byts[consumed:]
982 ans.append('Unknown (vwi: always 0?): %d'%arg2)
983
984 arg3, consumed = decint(byts)
985 byts = byts[consumed:]
986 fsi = arg3 >> 4
987 extra = arg3 & 0b1111
988 ans.append('First section index (fvwi): %d'%fsi)
989 psi = self.get_index(fsi)
990 ans.append('Extra bits (flag: always 0?): %d'%extra)
991
992 byts = tbs_type_6(byts, psi=psi,
993 msg=('First article of ending section, relative to its'
994 ' parent\'s index'))
995 if byts:
996 # We have a transition not just an opening first section
997 psi = self.get_index(psi.index+1)
998 arg, consumed = decint(byts)
999 off = arg >> 4
1000 byts = byts[consumed:]
1001 flags = arg & 0b1111
1002 ans.append('Last article of ending section w.r.t. starting'
1003 ' section offset (fvwi): %d [%d absolute]'%(off,
1004 psi.index+off))
1005 ans.append('Flags (always 8?): %d'%flags)
1006 byts = tbs_type_6(byts, psi=psi)
1007 # }}}
1008
1009 elif tbs_type == 7: # {{{
1010 # This occurs for records that have no section nodes and
1011 # whose parent section's index == 1
1012 ans.append('Unknown (maybe vwi?): %r'%bytes(byts[:2]))
1013 byts = byts[2:]
1014 arg, consumed = decint(byts)
1015 byts = byts[consumed:]
1016 ai = arg >> 4
1017 flags = arg & 0b1111
1018 ans.append('Article at start of record (fvwi): %d'%ai)
1019 if flags == 4:
1020 num = byts[0]
1021 byts = byts[1:]
1022 ans.append('Number of articles in record (byte): %d'%num)
1023 elif flags == 0:
1024 pass
1025 elif flags == 1:
1026 arg, consumed = decint(byts)
1027 byts = byts[consumed:]
1028 ans.append('EOF (vwi: should be 0): %d'%arg)
1029 else:
1030 raise ValueError('Unknown flags value: %d'%flags)
1031 # }}}
1032
1033 elif tbs_type == 6: # {{{
1034 # This is used for records spanned by an article whose parent
1035 # section's index == 1 or for the opening record if it contains the
1036 # periodical start, section 1 start and at least one article. The
1037 # two cases are distinguished by the flags on the article index
1038 # vwi.
1039 unk = byts[0]
1040 byts = byts[1:]
1041 ans.append('Unknown (byte: always 2?): %d'%unk)
1042 byts = tbs_type_6(byts)
1043 # }}}
1044
1045 elif tbs_type == 2: # {{{
1046 # This occurs for records with no section nodes and whose parent
1047 # section's index != 1 (undefined (records before the first
1048 # section) or > 1)
1049 # This is also used for records that are spanned by an article
1050 # whose parent section index > 1. In this case the flags of the
1051 # vwi referring to the article at the start
1052 # of the record are set to 1 instead of 4.
1053 arg, consumed = decint(byts)
1054 byts = byts[consumed:]
1055 flags = (arg & 0b1111)
1056 psi = (arg >> 4)
1057 ans.append('Parent section index (fvwi): %d'%psi)
1058 psi = self.get_index(psi)
1059 ans.append('Flags: %d'%flags)
1060 if flags == 1:
1061 arg, consumed = decint(byts)
1062 byts = byts[consumed:]
1063 ans.append('Unknown (vwi?: always 0?): %d'%arg)
1064 byts = tbs_type_6(byts, psi=psi)
1065 elif flags == 0:
1066 byts = tbs_type_6(byts, psi=psi)
1067 else:
1068 raise ValueError('Unkown flags: %d'%flags)
1069 # }}}
1070
1071 return byts, ans
1072
1073# }}}
1074
796class MOBIFile(object): # {{{1075class MOBIFile(object): # {{{
7971076
798 def __init__(self, stream):1077 def __init__(self, stream):
@@ -874,6 +1153,9 @@
874 else:1153 else:
875 self.binary_records.append(BinaryRecord(i, r))1154 self.binary_records.append(BinaryRecord(i, r))
8761155
1156 if self.index_record is not None:
1157 self.tbs_indexing = TBSIndexing(self.text_records,
1158 self.index_record.indices, self.mobi_header.type_raw)
8771159
878 def print_header(self, f=sys.stdout):1160 def print_header(self, f=sys.stdout):
879 print (str(self.palmdb).encode('utf-8'), file=f)1161 print (str(self.palmdb).encode('utf-8'), file=f)
@@ -905,6 +1187,9 @@
905 print(str(f.cncx).encode('utf-8'), file=out)1187 print(str(f.cncx).encode('utf-8'), file=out)
906 print('\n\n', file=out)1188 print('\n\n', file=out)
907 print(str(f.index_record), file=out)1189 print(str(f.index_record), file=out)
1190 with open(os.path.join(ddir, 'tbs_indexing.txt'), 'wb') as out:
1191 print(str(f.tbs_indexing), file=out)
1192 f.tbs_indexing.dump(ddir)
9081193
909 for tdir, attr in [('text', 'text_records'), ('images', 'image_records'),1194 for tdir, attr in [('text', 'text_records'), ('images', 'image_records'),
910 ('binary', 'binary_records')]:1195 ('binary', 'binary_records')]:
9111196
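
TBSIndexing buckets every index entry against each text record's byte range: an entry whose offset lies inside the record "starts" there, one whose last byte lies inside it "ends" there, and one wholly contained in it is "complete". A stripped-down sketch of that classification (record geometry and entry values are taken from the examples in the next file)::

    def classify(offset, size, rec_start, rec_end):
        # mirrors the has_start/has_end checks in TBSIndexing.__init__
        iend = offset + size - 1
        has_start = rec_start <= offset <= rec_end
        has_end = rec_start <= iend <= rec_end
        if has_start and has_end:
            return 'complete'
        if has_start:
            return 'starts'
        if has_end:
            return 'ends'
        return None  # the entry only spans, or misses, this record

    print(classify(215, 68470, 0, 4095))  # 'starts'
    print(classify(549, 1866, 0, 4095))   # 'complete'
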
=== added file 'src/calibre/ebooks/mobi/tbs_periodicals.rst'
--- src/calibre/ebooks/mobi/tbs_periodicals.rst 1970-01-01 00:00:00 +0000
+++ src/calibre/ebooks/mobi/tbs_periodicals.rst 2011-07-22 18:03:36 +0000
@@ -0,0 +1,189 @@
1Reverse engineering the trailing byte sequences for hierarchical periodicals
2===============================================================================
3
4In the following, *vwi* means variable width integer and *fvwi* means a vwi whose lowest four bits are used as a flag.
5
6Opening record
7----------------
8
9The text record that contains the opening node for the periodical (depth=0 node in the NCX) can have TBS of 3 different forms:
10
11 1. If it has only the periodical node and no section/article nodes, TBS of type 2, like this::
12
13 Record #1: Starts at: 0 Ends at: 4095
14 Contains: 1 index entries (0 ends, 0 complete, 1 starts)
15 TBS bytes: 82 80
16 Starts:
17 Index Entry: 0 (Parent index: -1, Depth: 0, Offset: 215, Size: 68470) [j_x's Google reader]
18 TBS Type: 010 (2)
19 Outer Index entry: 0
20 Unknown (vwi: always 0?): 0
21
22 2. A periodical and a section node, but no article nodes, TBS type of 6, like this::
23
24 Record #1: Starts at: 0 Ends at: 4095
25 Contains: 2 index entries (0 ends, 0 complete, 2 starts)
26 TBS bytes: 86 80 2
27 Starts:
28 Index Entry: 0 (Parent index: -1, Depth: 0, Offset: 215, Size: 93254) [j_x's Google reader]
29 Index Entry: 1 (Parent index: 0, Depth: 1, Offset: 541, Size: 49280) [Ars Technica]
30 TBS Type: 110 (6)
31 Outer Index entry: 0
32 Unknown (vwi: always 0?): 0
33 Unknown (byte: always 2?): 2
34
35 3. If it has both the section 1 node and at least one article node, TBS of type 6, like this::
36
37 Record #1: Starts at: 0 Ends at: 4095
38 Contains: 4 index entries (0 ends, 1 complete, 3 starts)
39 TBS bytes: 86 80 2 c4 2
40 Complete:
41 Index Entry: 5 (Parent index: 1, Depth: 2, Offset: 549, Size: 1866) [Week in gaming: 3DS review, Crysis 2, George Hotz]
42 Starts:
43 Index Entry: 0 (Parent index: -1, Depth: 0, Offset: 215, Size: 79253) [j_x's Google reader]
44 Index Entry: 1 (Parent index: 0, Depth: 1, Offset: 541, Size: 35279) [Ars Technica]
45 Index Entry: 6 (Parent index: 1, Depth: 2, Offset: 2415, Size: 2764) [Week in Apple: ZFS on Mac OS X, rogue tethering, DUI apps, and more]
46 TBS Type: 110 (6)
47 Outer Index entry: 0
48 Unknown (vwi: always 0?): 0
49 Unknown (byte: always 2?): 2
50 Article index at start of record or first article index, relative to parent section (fvwi): 4 [5 absolute]
51 Number of article nodes in the record (byte): 2
52
53 If there was only a single article, instead of 2, then the last two bytes would be: c0, i.e. there would be no byte giving the number of articles in the record.
54
55
56Records with no nodes
57------------------------
58
59These records are spanned by a single article. They are of two types:
60
61 1. If the parent section index is 1, TBS type of 6, like this::
62
63 Record #4: Starts at: 12288 Ends at: 16383
64 Contains: 0 index entries (0 ends, 0 complete, 0 starts)
65 TBS bytes: 86 80 2 c1 80
66 TBS Type: 110 (6)
67 Outer Index entry: 0
68 Unknown (vwi: always 0?): 0
69 Unknown (byte: always 2?): 2
70 Article index at start of record or first article index, relative to parent section (fvwi): 4 [5 absolute]
71 EOF (vwi: should be 0): 0
72
73 If the record is before the first article, the TBS bytes would be: 86 80 2
74
75 2. If the parent section index is > 1, TBS type of 2, like this::
76
77 Record #14: Starts at: 53248 Ends at: 57343
78 Contains: 0 index entries (0 ends, 0 complete, 0 starts)
79 TBS bytes: 82 80 a0 1 e1 80
80 TBS Type: 010 (2)
81 Outer Index entry: 0
82 Unknown (vwi: always 0?): 0
83 Parent section index (fvwi): 2
84 Flags: 0
85 Article index at start of record or first article index, relative to parent section (fvwi): 14 [16 absolute]
86 EOF (vwi: should be 0): 0
87
88Records with only article nodes
89-----------------------------------
90
91Such records have no section transitions (i.e. a section end/section start pair). They have only one or more article nodes. They are of two types:
92
93 1. If the parent section index is 1, TBS type of 7, like this::
94
95 Record #6: Starts at: 20480 Ends at: 24575
96 Contains: 2 index entries (1 ends, 0 complete, 1 starts)
97 TBS bytes: 87 80 2 80 1 84 2
98 Ends:
99 Index Entry: 9 (Parent index: 1, Depth: 2, Offset: 16453, Size: 4199) [Vaccine's success spurs whooping cough comeback]
100 Starts:
101 Index Entry: 10 (Parent index: 1, Depth: 2, Offset: 20652, Size: 4246) [Apple's mobile products do not violate Nokia patents, says ITC]
102 TBS Type: 111 (7)
103 Outer Index entry: 0
104 Unknown (vwi: always 0?): 0
105 Unknown: '\x02\x80' (vwi?: Always 256)
106 Article at start of record (fvwi): 8
107 Number of articles in record (byte): 2
108
109 If there was only one article in the record, the last two bytes would be replaced by a single byte: 80
110
111 If this record is the first record with an article, then the article at the start of the record should be the last section index. At least, that's what kindlegen does, though if you ask me, it should be the first section index.
112
113
114 2. If the parent section index is > 1, TBS type of 2, like this::
115
116 Record #16: Starts at: 61440 Ends at: 65535
117 Contains: 5 index entries (1 ends, 3 complete, 1 starts)
118 TBS bytes: 82 80 a1 80 1 f4 5
119 Ends:
120 Index Entry: 17 (Parent index: 2, Depth: 2, Offset: 60920, Size: 1082) [Microsoft's Joe Belfiore still working on upcoming Zune hardware]
121 Complete:
122 Index Entry: 18 (Parent index: 2, Depth: 2, Offset: 62002, Size: 1016) [Rumour: OS X Lion nearing Golden Master stage]
123 Index Entry: 19 (Parent index: 2, Depth: 2, Offset: 63018, Size: 1045) [iOS 4.3.1 released]
124 Index Entry: 20 (Parent index: 2, Depth: 2, Offset: 64063, Size: 972) [Windows 8 'system reset' image leaks]
125 Starts:
126 Index Entry: 21 (Parent index: 2, Depth: 2, Offset: 65035, Size: 1057) [Windows Phone 7: Why it's failing]
127 TBS Type: 010 (2)
128 Outer Index entry: 0
129 Unknown (vwi: always 0?): 0
130 Parent section index (fvwi) : 2
131 Flags: 1
132 Unknown (vwi: always 0?): 0
133 Article index at start of record or first article index, relative to parent section (fvwi): 15 [17 absolute]
134 Number of article nodes in the record (byte): 5
135
136 If there was only one article in the record, the last two bytes would be replaced by a single byte: f0
137
138Records with a section transition
139-----------------------------------
140
141In such a record there is a transition from one section to the next. As such the record must have at least one article ending and one article starting, except in the case of the first section.
142
143TODO: Note you have to test the cases of first section, a single transition and multiple transitions.
144
145 1. The first section::
146
147 Record #2: Starts at: 4096 Ends at: 8191
148 Contains: 2 index entries (0 ends, 0 complete, 2 starts)
149 TBS bytes: 83 80 80 90 c0
150 Starts:
151 Index Entry: 1 (Parent index: 0, Depth: 1, Offset: 7758, Size: 26279) [Ars Technica]
152 Index Entry: 5 (Parent index: 1, Depth: 2, Offset: 7766, Size: 1866) [Week in gaming: 3DS review, Crysis 2, George Hotz]
153 TBS Type: 011 (3)
154 Outer Index entry: 0
155 Unknown (vwi: always 0?): 0
156 Unknown (vwi: always 0?): 0
157 First section index (fvwi) : 1
158 Extra bits: 0
159 First section starts
160 Article at start of block as offset from parent index (fvwi): 4 [5 absolute]
161 Flags: 0
162
163 If there was more than one article at the start then the last byte would be replaced by: c4 n where n is the number of articles
164
165
166Ending record
167----------------
168
169Logically, ending records must have at least one article ending, one section ending and the periodical ending. They are of TBS type 2, like this::
170
171 Record #17: Starts at: 65536 Ends at: 68684
172 Contains: 4 index entries (3 ends, 1 complete, 0 starts)
173 TBS bytes: 82 80 c0 4 f4 2
174 Ends:
175 Index Entry: 0 (Parent index: -1, Depth: 0, Offset: 215, Size: 68470) [j_x's Google reader]
176 Index Entry: 4 (Parent index: 0, Depth: 1, Offset: 51234, Size: 17451) [Slashdot]
177 Index Entry: 43 (Parent index: 4, Depth: 2, Offset: 65422, Size: 1717) [US ITC May Reverse Judge&#39;s Ruling In Kodak vs. Apple]
178 Complete:
179 Index Entry: 44 (Parent index: 4, Depth: 2, Offset: 67139, Size: 1546) [Google Starts Testing Google Music Internally]
180 TBS Type: 010 (2)
181 Outer Index entry: 0
182 Unknown (vwi: always 0?): 0
183 Parent section index (fvwi): 4
184 Flags: 0
185 Article at start of block as offset from parent index (fvwi): 39 [43 absolute]
186 Number of nodes (byte): 2
187
188If the record had only a single article end, the last two bytes would be replaced with: f0
189
0190
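
A worked decoding of the opening-record bytes 86 80 2 c4 2 from case 3 above, using a minimal forward vwi reader in the style of decint (a sketch of the byte layout only, not the shipping parser)::

    def read_vwi(byts):
        # 7 value bits per byte; a set high bit marks the final byte
        val, consumed = 0, 0
        for b in byts:
            consumed += 1
            val = (val << 7) | (b & 0b01111111)
            if b & 0b10000000:
                break
        return val, consumed

    tbs = bytearray(b'\x86\x80\x02\xc4\x02')
    outer, n = read_vwi(tbs)           # (6, 1)
    print(outer & 0b111, outer >> 3)   # TBS type 6, outer index entry 0
    print(read_vwi(tbs[n:]))           # (0, 1): the 'always 0?' vwi
    # tbs[2] == 2 is the 'always 2?' byte; the trailing fvwi 0xc4 splits into
    arg, _ = read_vwi(tbs[3:])         # (68, 1)
    print(arg >> 4, arg & 0b1111)      # article index 4, flags 4, so a count byte (2) follows
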
=== modified file 'src/calibre/ebooks/mobi/utils.py'
--- src/calibre/ebooks/mobi/utils.py 2011-07-20 20:01:41 +0000
+++ src/calibre/ebooks/mobi/utils.py 2011-07-22 18:03:36 +0000
@@ -79,7 +79,7 @@
 
 def decint(raw, forward=True):
     '''
-    Read a variable width integer from the bytestring raw and return the
+    Read a variable width integer from the bytestring or bytearray raw and return the
     integer and the number of bytes read. If forward is True bytes are read
     from the start of raw, otherwise from the end of raw.
 
@@ -88,8 +88,10 @@
     '''
     val = 0
     byts = bytearray()
-    for byte in raw if forward else reversed(raw):
-        bnum = ord(byte)
+    src = bytearray(raw)
+    if not forward:
+        src.reverse()
+    for bnum in src:
         byts.append(bnum & 0b01111111)
         if bnum & 0b10000000:
             break
 
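
With ord() gone, decint() accepts either a bytestring or a bytearray and still returns the decoded value together with the number of bytes consumed, e.g. (assuming the module is importable as laid out in this branch)::

    from calibre.ebooks.mobi.utils import decint

    print(decint(b'\x86\x80\x02'))             # (6, 1): 0x86 already has its stop bit set
    print(decint(bytearray(b'\x86\x80\x02')))  # (6, 1): bytearray input now works as well
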
=== modified file 'src/calibre/gui2/store/stores/chitanka_plugin.py'
--- src/calibre/gui2/store/stores/chitanka_plugin.py 2011-07-19 06:16:55 +0000
+++ src/calibre/gui2/store/stores/chitanka_plugin.py 2011-07-22 18:03:36 +0000
@@ -55,36 +55,21 @@
                 if counter <= 0:
                     break
 
-                id = ''.join(data.xpath('.//a[@class="booklink"]/@href'))
+                id = ''.join(data.xpath('.//a[@class="booklink"]/@href')).strip()
                 if not id:
                     continue
 
-                cover_url = ''.join(data.xpath('.//a[@class="booklink"]/img/@src'))
-                title = ''.join(data.xpath('.//a[@class="booklink"]/i/text()'))
-                author = ''.join(data.xpath('.//span[@class="bookauthor"]/a/text()'))
-                fb2 = ''.join(data.xpath('.//a[@class="dl dl-fb2"]/@href'))
-                epub = ''.join(data.xpath('.//a[@class="dl dl-epub"]/@href'))
-                txt = ''.join(data.xpath('.//a[@class="dl dl-txt"]/@href'))
-
-                # remove .zip extensions
-                if fb2.find('.zip') != -1:
-                    fb2 = fb2[:fb2.find('.zip')]
-                if epub.find('.zip') != -1:
-                    epub = epub[:epub.find('.zip')]
-                if txt.find('.zip') != -1:
-                    txt = txt[:txt.find('.zip')]
-
                 counter -= 1
 
                 s = SearchResult()
-                s.cover_url = cover_url
-                s.title = title.strip()
-                s.author = author.strip()
-                s.detail_item = id.strip()
+                s.cover_url = ''.join(data.xpath('.//a[@class="booklink"]/img/@src')).strip()
+                s.title = ''.join(data.xpath('.//a[@class="booklink"]/i/text()')).strip()
+                s.author = ''.join(data.xpath('.//span[@class="bookauthor"]/a/text()')).strip()
+                s.detail_item = id
                 s.drm = SearchResult.DRM_UNLOCKED
-                s.downloads['FB2'] = base_url + fb2.strip()
-                s.downloads['EPUB'] = base_url + epub.strip()
-                s.downloads['TXT'] = base_url + txt.strip()
+                s.downloads['FB2'] = base_url + ''.join(data.xpath('.//a[@class="dl dl-fb2"]/@href')).strip().replace('.zip', '')
+                s.downloads['EPUB'] = base_url + ''.join(data.xpath('.//a[@class="dl dl-epub"]/@href')).strip().replace('.zip', '')
+                s.downloads['TXT'] = base_url + ''.join(data.xpath('.//a[@class="dl dl-txt"]/@href')).strip().replace('.zip', '')
                 s.formats = 'FB2, EPUB, TXT, SFB'
                 yield s
 
@@ -106,35 +91,20 @@
                 if counter <= 0:
                     break
 
-                id = ''.join(data.xpath('.//a[@class="booklink"]/@href'))
+                id = ''.join(data.xpath('.//a[@class="booklink"]/@href')).strip()
                 if not id:
                     continue
 
-                cover_url = ''.join(data.xpath('.//a[@class="booklink"]/img/@src'))
-                title = ''.join(data.xpath('.//a[@class="booklink"]/i/text()'))
-                author = ''.join(data.xpath('.//span[@class="bookauthor"]/a/text()'))
-                fb2 = ''.join(data.xpath('.//a[@class="dl dl-fb2"]/@href'))
-                epub = ''.join(data.xpath('.//a[@class="dl dl-epub"]/@href'))
-                txt = ''.join(data.xpath('.//a[@class="dl dl-txt"]/@href'))
-
-                # remove .zip extensions
-                if fb2.find('.zip') != -1:
-                    fb2 = fb2[:fb2.find('.zip')]
-                if epub.find('.zip') != -1:
-                    epub = epub[:epub.find('.zip')]
-                if txt.find('.zip') != -1:
-                    txt = txt[:txt.find('.zip')]
-
                 counter -= 1
 
                 s = SearchResult()
-                s.cover_url = cover_url
-                s.title = title.strip()
-                s.author = author.strip()
-                s.detail_item = id.strip()
+                s.cover_url = ''.join(data.xpath('.//a[@class="booklink"]/img/@src')).strip()
+                s.title = ''.join(data.xpath('.//a[@class="booklink"]/i/text()')).strip()
+                s.author = ''.join(data.xpath('.//span[@class="bookauthor"]/a/text()')).strip()
+                s.detail_item = id
                 s.drm = SearchResult.DRM_UNLOCKED
-                s.downloads['FB2'] = base_url + fb2.strip()
-                s.downloads['EPUB'] = base_url + epub.strip()
-                s.downloads['TXT'] = base_url + txt.strip()
+                s.downloads['FB2'] = base_url + ''.join(data.xpath('.//a[@class="dl dl-fb2"]/@href')).strip().replace('.zip', '')
+                s.downloads['EPUB'] = base_url + ''.join(data.xpath('.//a[@class="dl dl-epub"]/@href')).strip().replace('.zip', '')
+                s.downloads['TXT'] = base_url + ''.join(data.xpath('.//a[@class="dl dl-txt"]/@href')).strip().replace('.zip', '')
                 s.formats = 'FB2, EPUB, TXT, SFB'
                 yield s
 
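
One behavioural nuance of the consolidation above: the old code cut the link at the first '.zip', while the new code removes every '.zip' substring via str.replace(); for chitanka's download links both give the same result (the path below is hypothetical)::

    href = '/download/kniga.fb2.zip'
    print(href[:href.find('.zip')])   # '/download/kniga.fb2' (old slicing)
    print(href.replace('.zip', ''))   # '/download/kniga.fb2' (new one-liner)
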
=== added file 'src/calibre/gui2/store/stores/eknigi_plugin.py'
--- src/calibre/gui2/store/stores/eknigi_plugin.py 1970-01-01 00:00:00 +0000
+++ src/calibre/gui2/store/stores/eknigi_plugin.py 2011-07-22 18:03:36 +0000
@@ -0,0 +1,88 @@
+# -*- coding: utf-8 -*-
+
+from __future__ import (unicode_literals, division, absolute_import, print_function)
+
+__license__ = 'GPL 3'
+__copyright__ = '2011, Alex Stanev <alex@stanev.org>'
+__docformat__ = 'restructuredtext en'
+
+import random
+import urllib2
+from contextlib import closing
+
+from lxml import html
+
+from PyQt4.Qt import QUrl
+
+from calibre import browser, url_slash_cleaner
+from calibre.gui2 import open_url
+from calibre.gui2.store import StorePlugin
+from calibre.gui2.store.basic_config import BasicStoreConfig
+from calibre.gui2.store.search_result import SearchResult
+from calibre.gui2.store.web_store_dialog import WebStoreDialog
+
+class eKnigiStore(BasicStoreConfig, StorePlugin):
+
+    def open(self, parent=None, detail_item=None, external=False):
+        # Use Kovid's affiliate id 30% of the time
+        if random.randint(1, 10) in (1, 2, 3):
+            aff_suffix = '&amigosid=23'
+        else:
+            aff_suffix = '&amigosid=22'
+        url = 'http://e-knigi.net/?' + aff_suffix[1:]
+
+        if external or self.config.get('open_external', False):
+            if detail_item:
+                url = detail_item + aff_suffix
+            open_url(QUrl(url_slash_cleaner(url)))
+        else:
+            detail_url = None
+            if detail_item:
+                url = detail_item + aff_suffix
+            d = WebStoreDialog(self.gui, url, parent, detail_url)
+            d.setWindowTitle(self.name)
+            d.set_tags(self.config.get('tags', ''))
+            d.exec_()
+
+    def search(self, query, max_results=10, timeout=60):
+        base_url = 'http://e-knigi.net'
+        url = base_url + '/virtuemart?page=shop.browse&search_category=0&search_limiter=anywhere&limitstart=0&limit=' + str(max_results) + '&keyword=' + urllib2.quote(query)
+
+        br = browser()
+
+        counter = max_results
+        with closing(br.open(url, timeout=timeout)) as f:
+            doc = html.fromstring(f.read())
+
+            # if the store finds only one product, it opens directly detail view
+            for data in doc.xpath('//div[@class="prod_details"]'):
+                s = SearchResult()
+                s.cover_url = ''.join(data.xpath('.//div[@class="vm_main_info clearfix"]/div[@class="lf"]/a/img/@src')).strip()
+                s.title = ''.join(data.xpath('.//div[@class="vm_main_info clearfix"]/div[@class="lf"]/a/img/@alt')).strip()
+                s.author = ''.join(data.xpath('.//div[@class="td_bg clearfix"]/div[@class="gk_product_tab"]/div/table/tr[3]/td[2]/text()')).strip()
+                s.price = ''.join(data.xpath('.//span[@class="productPrice"]/text()')).strip()
+                s.detail_item = url
+                s.drm = SearchResult.DRM_UNLOCKED
+
+                yield s
+                return
+
+            # search in store results
+            for data in doc.xpath('//div[@class="browseProductContainer"]'):
+                if counter <= 0:
+                    break
+                id = ''.join(data.xpath('.//a[1]/@href')).strip()
+                if not id:
+                    continue
+
+                counter -= 1
+
+                s = SearchResult()
+                s.cover_url = ''.join(data.xpath('.//a[@class="gk_vm_product_image"]/img/@src')).strip()
+                s.title = ''.join(data.xpath('.//a[@class="gk_vm_product_image"]/img/@title')).strip()
+                s.author = ''.join(data.xpath('.//div[@style="float:left;width:90%"]/b/text()')).strip().replace('Автор: ', '')
+                s.price = ''.join(data.xpath('.//span[@class="productPrice"]/text()')).strip()
+                s.detail_item = base_url + id
+                s.drm = SearchResult.DRM_UNLOCKED
+
+                yield s
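
The affiliate handling in open() matches the commit message: random.randint(1, 10) is uniform over 1..10, so membership in (1, 2, 3) selects Kovid's id with probability 3/10. A quick illustrative check (seeded only to make the run repeatable)::

    import random

    random.seed(0)
    hits = sum(random.randint(1, 10) in (1, 2, 3) for _ in xrange(100000))
    print(hits / 100000.0)  # ~0.30
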
=== modified file 'src/calibre/translations/msgfmt.py'
--- src/calibre/translations/msgfmt.py 2008-05-02 16:41:12 +0000
+++ src/calibre/translations/msgfmt.py 2011-07-22 18:03:36 +0000
@@ -1,20 +1,39 @@
 #! /usr/bin/env python
 # Written by Martin v. Loewis <loewis@informatik.hu-berlin.de>
-# Modified by Kovid Goyal <kovid@kovidgoyal.net>
 
 """Generate binary message catalog from textual translation description.
 
 This program converts a textual Uniforum-style message catalog (.po file) into
 a binary GNU catalog (.mo file). This is essentially the same function as the
 GNU msgfmt program, however, it is a simpler implementation.
+
+Usage: msgfmt.py [OPTIONS] filename.po
+
+Options:
+    -o file
+    --output-file=file
+        Specify the output file to write to. If omitted, output will go to a
+        file named filename.mo (based off the input file name).
+
+    -h
+    --help
+        Print this message and exit.
+
+    -V
+    --version
+        Display version information and exit.
 """
 
 import sys
 import os
+import getopt
 import struct
 import array
 
-__version__ = "1.2"
+__version__ = "1.1"
+
+MESSAGES = {}
+
 
 def usage(code, msg=''):
     print >> sys.stderr, __doc__
@@ -23,16 +42,16 @@
     sys.exit(code)
 
 
-
-def add(id, str, fuzzy, MESSAGES):
+def add(id, str, fuzzy):
     "Add a non-fuzzy translation to the dictionary."
+    global MESSAGES
     if not fuzzy and str:
         MESSAGES[id] = str
 
 
-
-def generate(MESSAGES):
+def generate():
     "Return the generated output."
+    global MESSAGES
     keys = MESSAGES.keys()
     # the keys are sorted in the .mo file
     keys.sort()
@@ -44,6 +63,7 @@
         offsets.append((len(ids), len(id), len(strs), len(MESSAGES[id])))
         ids += id + '\0'
         strs += MESSAGES[id] + '\0'
+    output = ''
     # The header is 7 32-bit unsigned integers. We don't use hash tables, so
     # the keys start right after the index tables.
     # translated string.
@@ -71,9 +91,7 @@
     return output
 
 
-
 def make(filename, outfile):
-    MESSAGES = {}
     ID = 1
     STR = 2
 
@@ -101,7 +119,7 @@
         lno += 1
         # If we get a comment line after a msgstr, this is a new entry
         if l[0] == '#' and section == STR:
-            add(msgid, msgstr, fuzzy, MESSAGES)
+            add(msgid, msgstr, fuzzy)
             section = None
             fuzzy = 0
         # Record a fuzzy mark
@@ -111,16 +129,39 @@
         if l[0] == '#':
             continue
         # Now we are in a msgid section, output previous section
-        if l.startswith('msgid'):
+        if l.startswith('msgid') and not l.startswith('msgid_plural'):
             if section == STR:
-                add(msgid, msgstr, fuzzy, MESSAGES)
+                add(msgid, msgstr, fuzzy)
             section = ID
             l = l[5:]
             msgid = msgstr = ''
+            is_plural = False
+        # This is a message with plural forms
+        elif l.startswith('msgid_plural'):
+            if section != ID:
+                print >> sys.stderr, 'msgid_plural not preceeded by msgid on %s:%d' %\
+                    (infile, lno)
+                sys.exit(1)
+            l = l[12:]
+            msgid += '\0' # separator of singular and plural
+            is_plural = True
         # Now we are in a msgstr section
         elif l.startswith('msgstr'):
             section = STR
-            l = l[6:]
+            if l.startswith('msgstr['):
+                if not is_plural:
+                    print >> sys.stderr, 'plural without msgid_plural on %s:%d' %\
+                        (infile, lno)
+                    sys.exit(1)
+                l = l.split(']', 1)[1]
+                if msgstr:
+                    msgstr += '\0' # Separator of the various plural forms
+            else:
+                if is_plural:
+                    print >> sys.stderr, 'indexed msgstr required for plural on %s:%d' %\
+                        (infile, lno)
+                    sys.exit(1)
+                l = l[6:]
         # Skip empty lines
         l = l.strip()
         if not l:
@@ -138,22 +179,40 @@
             sys.exit(1)
     # Add last entry
     if section == STR:
-        add(msgid, msgstr, fuzzy, MESSAGES)
+        add(msgid, msgstr, fuzzy)
 
     # Compute output
-    output = generate(MESSAGES)
+    output = generate()
 
+    outfile.write(output)
+
+
+def main():
     try:
-        outfile.write(output)
-    except IOError,msg:
-        print >> sys.stderr, msg
-
-
-
-def main(outfile, args=sys.argv[1:]):
+        opts, args = getopt.getopt(sys.argv[1:], 'hVo:',
+                                   ['help', 'version', 'output-file='])
+    except getopt.error, msg:
+        usage(1, msg)
+
+    outfile = None
+    # parse options
+    for opt, arg in opts:
+        if opt in ('-h', '--help'):
+            usage(0)
+        elif opt in ('-V', '--version'):
+            print >> sys.stderr, "msgfmt.py", __version__
+            sys.exit(0)
+        elif opt in ('-o', '--output-file'):
+            outfile = arg
+    # do it
+    if not args:
+        print >> sys.stderr, 'No input file given'
+        print >> sys.stderr, "Try `msgfmt --help' for more information."
+        return
+
     for filename in args:
         make(filename, outfile)
-    return 0
+
 
 if __name__ == '__main__':
-    sys.exit(main(sys.stdout))
+    main()
 
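
make() still compiles a .po catalogue and writes the .mo data to whatever file-like object it is handed, which is exactly how localization.py below uses it; a minimal sketch of that call (the catalogue path is only an example)::

    import cStringIO
    from calibre.translations.msgfmt import make

    buf = cStringIO.StringIO()
    make('bg.po', buf)
    mo_data = buf.getvalue()  # binary .mo catalogue, ready for gettext
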
=== modified file 'src/calibre/utils/localization.py'
--- src/calibre/utils/localization.py 2011-07-14 22:55:58 +0000
+++ src/calibre/utils/localization.py 2011-07-22 18:03:36 +0000
@@ -71,13 +71,13 @@
     lang = get_lang()
     if lang:
         buf = iso639 = None
-        if os.access(lang+'.po', os.R_OK):
+        mpath = get_lc_messages_path(lang)
+        if mpath and os.access(mpath+'.po', os.R_OK):
             from calibre.translations.msgfmt import make
             buf = cStringIO.StringIO()
-            make(lang+'.po', buf)
+            make(mpath+'.po', buf)
             buf = cStringIO.StringIO(buf.getvalue())
 
-        mpath = get_lc_messages_path(lang)
         if mpath is not None:
             with ZipFile(P('localization/locales.zip',
                 allow_user_override=False), 'r') as zf:
 
=== modified file 'src/calibre/web/feeds/recipes/model.py'
--- src/calibre/web/feeds/recipes/model.py 2011-06-25 04:47:59 +0000
+++ src/calibre/web/feeds/recipes/model.py 2011-07-22 18:03:36 +0000
@@ -217,6 +217,8 @@
             self.all_urns.add(urn)
             if ok(urn):
                 lang = x.get('language', 'und')
+                if lang:
+                    lang = lang.replace('-', '_')
                 if lang not in lang_map:
                     lang_map[lang] = factory(NewsCategory, new_root, lang)
                 factory(NewsItem, lang_map[lang], urn, x.get('title'))
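
The normalisation added here maps hyphenated language codes from recipe metadata onto the underscore form (compare the united_daily.recipe change above), e.g.::

    lang = 'zh-TW'
    if lang:
        lang = lang.replace('-', '_')
    print(lang)  # 'zh_TW'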
