forked from Nandaka/PixivUtil2
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathPixivTags.py
118 lines (99 loc) · 4.04 KB
/
PixivTags.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
# -*- coding: utf-8 -*-
# pylint: disable=I0011, C, C0302
import json
import os
import re
import PixivHelper
from PixivException import PixivException
class PixivTagsItem:
    '''One image entry of a tag search result.

    Plain value holder: the constructor stores its arguments unchanged on
    the instance, no conversion or validation is done here.
    '''
    # Class-level defaults; every instance overwrites them in __init__.
    imageId: int = 0
    bookmarkCount: int = 0
    imageResponse: int = 0
    ai_type: int = -1

    def __init__(self, image_id, bookmark_count, image_response_count, ai_type=-1):
        '''Store the image id, its counters and the AI type flag.

        image_id             -- stored as self.imageId
        bookmark_count       -- stored as self.bookmarkCount
        image_response_count -- stored as self.imageResponse
        ai_type              -- stored as self.ai_type, defaults to -1
        '''
        self.imageId = image_id
        self.bookmarkCount = bookmark_count
        self.imageResponse = image_response_count
        self.ai_type = ai_type

    def __repr__(self):
        '''Return a debug representation listing all four fields.'''
        return (f"{type(self).__name__}(imageId={self.imageId!r}, "
                f"bookmarkCount={self.bookmarkCount!r}, "
                f"imageResponse={self.imageResponse!r}, "
                f"ai_type={self.ai_type!r})")
class PixivTags:
    '''Class for parsing tags search page.

    parseMemberTags() and parseTags() fill the attributes below;
    PrintInfo() dumps them. parseTagsList() is an independent helper that
    reads a list of tags from a text file.
    '''
    # Parse results; they stay None until one of the parse methods has run.
    itemList = None
    haveImage = None
    isLastPage = None
    # "total" value of the last payload handled by parseTags().
    availableImages = 0
    query = ""
    memberId = 0
    # Number of entries (adverts included) that parseTags() treats as a full page.
    POSTS_PER_PAGE = 60
    page = -1

    def parseMemberTags(self, artist, memberId, query=""):
        '''process artist result and return the image list, https://www.pixiv.net/ajax/user/25661139/illustmanga/tag/<search_tags>

        Copies haveImages / isLastPage from `artist` and wraps every entry of
        artist.imageList in a PixivTagsItem with zeroed counters. The result
        is stored in self.itemList; the method itself returns None.
        '''
        self.itemList = list()
        self.memberId = memberId
        self.query = query
        self.haveImage = artist.haveImages
        self.isLastPage = artist.isLastPage
        self.itemList.extend(PixivTagsItem(int(image), 0, 0) for image in artist.imageList)

    def parseTags(self, page, query="", curr_page=1):
        '''From search by tags page, https://www.pixiv.net/ajax/search/artworks/<search_tags>

        page      -- JSON text of the search response
        query     -- search string, only recorded in self.query
        curr_page -- page number, only recorded in self.page

        Returns self.itemList, a list of PixivTagsItem. Raises PixivException
        with SERVER_ERROR when the payload's "error" field is truthy.
        '''
        payload = json.loads(page)
        self.query = query
        self.page = curr_page

        # check error
        if payload["error"]:
            raise PixivException(f'Image Error: {payload["message"]}', errorCode=PixivException.SERVER_ERROR)

        # parse images information
        search_result = payload["body"]["illustManga"]
        self.itemList = list()
        ad_container_count = 0
        for item in search_result["data"]:
            # Advert placeholders carry no image; they are only counted so
            # that the page-size check below still adds up.
            if item.get("isAdContainer"):
                ad_container_count += 1
                continue

            image_id = int(item["id"])
            ai_type = int(item["aiType"]) if "aiType" in item else -1
            # like count not available anymore, need to call separate request...
            self.itemList.append(PixivTagsItem(image_id, 0, 0, ai_type))

        self.haveImage = bool(self.itemList)

        # search page info
        self.availableImages = int(search_result["total"])
        # assume it always return 60 images, including the advert
        self.isLastPage = len(self.itemList) + ad_container_count != PixivTags.POSTS_PER_PAGE

        return self.itemList

    def PrintInfo(self):
        '''Print a summary of the current search state.

        Safe to call before any parse method has run: a missing item list is
        reported as empty instead of raising.
        '''
        items = self.itemList if self.itemList is not None else []

        PixivHelper.safePrint('Search Result')
        if self.memberId > 0:
            PixivHelper.safePrint(f'Member Id: {self.memberId}')
        PixivHelper.safePrint(f'Query: {self.query}')
        PixivHelper.safePrint(f'haveImage : {self.haveImage}')
        PixivHelper.safePrint(f'urls : {len(items)}')
        for item in items:
            print(f"\tImage Id: {item.imageId}\tFav Count:{item.bookmarkCount}")
        PixivHelper.safePrint(f'total : {self.availableImages}')
        PixivHelper.safePrint(f'last? : {self.isLastPage}')

    @staticmethod
    def parseTagsList(filename):
        '''read tags.txt and return the tags list

        Lines starting with '#' and lines that are empty after stripping are
        skipped; every other line is returned stripped of surrounding
        whitespace. Raises PixivException with
        FILE_NOT_EXISTS_OR_NO_PERMISSION when `filename` does not exist.
        '''
        if not os.path.exists(filename):
            raise PixivException(f"File doesn't exists or no permission to read: {filename}", PixivException.FILE_NOT_EXISTS_OR_NO_PERMISSION)

        tags = list()
        reader = PixivHelper.open_text_file(filename)
        try:
            for line in reader:
                # The '#' test is done on the raw line, before stripping, so
                # only a '#' in the very first column marks a comment.
                if line.startswith('#') or len(line) < 1:
                    continue
                line = line.strip()
                if len(line) > 0:
                    tags.append(line)
        finally:
            # Close the file even when reading or decoding a line fails.
            reader.close()
        return tags