|
1
|
|
|
#!/usr/bin/env python |
|
2
|
|
|
# -*- coding: utf8 -*- |
|
3
|
|
|
# |
|
4
|
|
|
# bylist.py : related to sites that give one RSS/Atom feed for |
|
5
|
|
|
# all the projects (such as freshcode.club) |
|
6
|
|
|
# |
|
7
|
|
|
# (C) Copyright 2016 - 2018 Olivier Delhomme |
|
8
|
|
|
# e-mail : [email protected] |
|
9
|
|
|
# |
|
10
|
|
|
# This program is free software; you can redistribute it and/or modify |
|
11
|
|
|
# it under the terms of the GNU General Public License as published by |
|
12
|
|
|
# the Free Software Foundation; either version 3, or (at your option) |
|
13
|
|
|
# any later version. |
|
14
|
|
|
# |
|
15
|
|
|
# This program is distributed in the hope that it will be useful, |
|
16
|
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of |
|
17
|
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
|
18
|
|
|
# GNU General Public License for more details. |
|
19
|
|
|
# |
|
20
|
|
|
# You should have received a copy of the GNU General Public License |
|
21
|
|
|
# along with this program; if not, write to the Free Software Foundation, |
|
22
|
|
|
# Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA. |
|
23
|
|
|
# |
|
24
|
|
|
import re |
|
25
|
|
|
import caches |
|
26
|
|
|
import common |
|
27
|
|
|
|
|
28
|
|
|
|
|
29
|
|
|
def cut_title_with_default_method(title):
    """
    Cuts title with a default method and a fallback.

    The stripped title is cut at its first run of whitespace: the first
    word is taken as the project name and everything after it as the
    version. When the stripped title holds at most one word the whole
    of it is the project name and the version is the empty string.

    - title is the string to cut

    Returns a (project, version) tuple of strings.

    >>> cut_title_with_default_method('versions 1.3.2')
    ('versions', '1.3.2')
    >>> cut_title_with_default_method('no_version_project')
    ('no_version_project', '')
    >>> cut_title_with_default_method('versions   1.3.2')
    ('versions', '1.3.2')
    >>> cut_title_with_default_method('')
    ('', '')
    """

    stripped = title.strip()

    try:
        # split(None, 1) cuts on any run of whitespace (several spaces,
        # tabs...) so that the version never begins with a separator
        (project, version) = stripped.split(None, 1)

    except ValueError:
        # Zero or one word: nothing is left to be used as a version
        project = stripped
        version = ''

    return (project, version)

# End of cut_title_with_default_method() function
|
48
|
|
|
|
|
49
|
|
|
|
|
50
|
|
|
def cut_title_with_regex_method(title, regex):
    r"""
    Cuts title using a regex. If it does not succeed, tells the caller
    to fall back to the default method.

    - title is the string to cut
    - regex is a pattern for re.match() (anchored at the beginning of
      title) whose group 1 is the project name and group 2 the version

    Returns a (project, version, default) tuple. default is True when
    the regex could not be used to cut the title, that is when it did
    not match or when it declares fewer than two groups; project and
    version are then empty strings. A group that exists in the regex
    but did not take part in the match is returned as an empty string.

    >>> cut_title_with_regex_method('versions 1.3.2', r'([\w]+)\s([\d\.]+)')
    ('versions', '1.3.2', False)
    >>> cut_title_with_regex_method('versions 1.3.2', r'([\w]+)notgood\s([\d\.]+)')
    ('', '', True)
    >>> cut_title_with_regex_method('versions 1.3.2', r'([\w]+)')
    ('', '', True)
    """

    unusable = ('', '', True)

    res = re.match(regex, title)
    if not res:
        return unusable

    try:
        project = res.group(1)
        version = res.group(2)
    except IndexError:
        # The regex has fewer than two groups: it can not give both a
        # project and a version so let the caller use the default method
        return unusable

    # group() gives None for an optional group that did not participate
    # in the match: callers expect strings
    return (project or '', version or '', False)

# End of cut_title_with_regex_method() function
|
74
|
|
|
|
|
75
|
|
|
|
|
76
|
|
|
def cut_title_in_project_version(title, regex):
    r"""
    Cuts the title into a (project, version) tuple.

    When regex is not None the cut is first tried with
    cut_title_with_regex_method(). The default method
    (cut_title_with_default_method()) is used when there is no regex
    or when the regex method reports that it could not cut the title.

    >>> cut_title_in_project_version('versions 1.3.2', None)
    ('versions', '1.3.2')
    >>> cut_title_in_project_version('no_version_project', None)
    ('no_version_project', '')
    >>> cut_title_in_project_version('versions 1.3.2', r'([\w]+)badregex\s([\d\.]+)')
    ('versions', '1.3.2')
    >>> cut_title_in_project_version('versions 1.3.2', r'([\w]+)\s([\d\.i\-rcbetaRCBETA]+)')
    ('versions', '1.3.2')
    """

    # Without any regex the default method is the only one available
    use_default = True

    if regex is not None:
        (project, version, use_default) = cut_title_with_regex_method(title, regex)

    if use_default:
        (project, version) = cut_title_with_default_method(title)

    return (project, version)

# End of cut_title_in_project_version() function
|
105
|
|
|
|
|
106
|
|
|
|
|
107
|
|
|
def lower_list_of_strings(project_list):
    """
    Builds a new list with the lowercased version of every string of
    project_list (order is kept, project_list itself is not modified).
    This eases sorting and comparisons.

    >>> lower_list_of_strings(['TEST', 'LoweRed'])
    ['test', 'lowered']
    """

    return [name.lower() for name in project_list]

# End of lower_list_of_strings() function
|
119
|
|
|
|
|
120
|
|
|
|
|
121
|
|
|
def split_multiproject_title_into_list(title, multiproject):
    """
    Splits title into a list of project titles.

    - title is the string to split
    - multiproject is either None or the separator pattern: it is given
      as is to re.split() so it is interpreted as a regular expression

    Returns a list of strings. When multiproject is None the list only
    contains title itself.

    >>> split_multiproject_title_into_list('one 1.0, two 2.0', ', ')
    ['one 1.0', 'two 2.0']
    >>> split_multiproject_title_into_list('one 1.0, two 2.0', None)
    ['one 1.0, two 2.0']
    """

    # No separator configured: the title describes a single project
    if multiproject is None:
        return [title]

    return re.split(multiproject, title)

# End of split_multiproject_title_into_list() function
|
135
|
|
|
|
|
136
|
|
|
|
|
137
|
|
|
def check_and_update_feed(feed_list, project_list, cache, debug, regex, multiproject):
    """
    Checks every feed entry in the list against project list cache and
    then updates the dictionary then writes the cache file to the disk.
     - feed_list is a list of feed (from feedparser module)
     - project_list is the list of project as read from the yaml
       configuration file
     - cache is an initialized instance of FileCache
     - debug is passed as is to common.print_debug() and to the cache
       methods
     - regex is either None or the pattern used to cut a title into
       project and version (see cut_title_in_project_version())
     - multiproject is either None or the pattern used to split one
       entry title into several project titles (see
       split_multiproject_title_into_list())
    """

    # Lowers the list before searching in it. A set is built once so
    # that each membership test below does not scan the whole list
    known_projects = set(lower_list_of_strings(project_list))

    # Checking every feed entry of the list and updates the
    # dictionary accordingly
    for entry in feed_list:

        titles = split_multiproject_title_into_list(entry.title, multiproject)

        for title in titles:
            (project, version) = cut_title_in_project_version(title, regex)
            common.print_debug(debug, u'\tChecking {0:16}: {1}'.format(project, version))

            # Comparison is case insensitive but the cache receives the
            # project name as it was written in the feed
            if project.lower() in known_projects:
                cache.print_if_newest_version(project, version, debug)
                cache.update_cache_dict(project, version, debug)

    # Written once, after every entry has been processed
    cache.write_cache_file()

# End of check_and_update_feed() function
|
166
|
|
|
|
|
167
|
|
|
|
|
168
|
|
|
def check_versions_for_list_sites(feed_project_list, url, cache_filename, feed_filename, local_dir, debug, regex, multiproject):
    """
    Checks projects of 'list' type sites such as freshcode's web site's RSS
     - feed_project_list is the list of projects to look for in the feed
     - url is the address the feed is retrieved from
     - cache_filename is the name of the file used by the FileCache that
       is created in local_dir
     - feed_filename is the name of the file used by the FeedCache that
       is created in local_dir
     - debug is passed as is to common.print_debug() and to
       check_and_update_feed()
     - regex and multiproject are passed as is to check_and_update_feed()
    """

    freshcode_cache = caches.FileCache(local_dir, cache_filename)

    feed_info = caches.FeedCache(local_dir, feed_filename)
    feed_info.read_cache_feed()

    feed = common.get_feed_entries_from_url(url)

    if feed is not None:
        common.print_debug(debug, u'\tFound {} entries'.format(len(feed.entries)))
        feed_list = common.make_list_of_newer_feeds(feed, feed_info, debug)
        common.print_debug(debug, u'\tFound {} new entries (relative to {})'.format(len(feed_list), feed_info.date_minutes))

        check_and_update_feed(feed_list, feed_project_list, freshcode_cache, debug, regex, multiproject)

        # Updating feed_info with the latest parsed feed entry date.
        # A feed that was retrieved but has no entry at all gives no
        # date to record: the previously read one is then kept instead
        # of failing on entries[0]
        if len(feed.entries) > 0:
            feed_info.update_cache_feed(feed.entries[0].published_parsed)

    feed_info.write_cache_feed()

# End of check_versions_for_list_sites() function
|
193
|
|
|
|
|
194
|
|
|
|
|
195
|
|
|
def check_versions(versions_conf, list_site_list):
    """
    Checks versions for every site named in list_site_list.

    For each site name the project list, url, cache filename, regex and
    multiproject settings are read from versions_conf and handed to
    check_versions_for_list_sites(). The feed cache file of a site is
    named '<site_name>.feed'.
    """

    for site in list_site_list:
        common.print_debug(versions_conf.options.debug, u'Checking {} updates'.format(site))

        # The fourth value returned for a site is not needed here
        (projects, site_url, cache_name, _unused_entry) = versions_conf.get_infos_for_site(site)

        site_regex = versions_conf.extract_regex_from_site(site)
        site_multiproject = versions_conf.extract_multiproject_from_site(site)
        feed_name = u'{}.feed'.format(site)

        check_versions_for_list_sites(
            projects,
            site_url,
            cache_name,
            feed_name,
            versions_conf.local_dir,
            versions_conf.options.debug,
            site_regex,
            site_multiproject)

# End of check_versions() function
|
209
|
|
|
|