1 # Fedi API Block - An aggregator for fetching blocking data from fediverse nodes
2 # Copyright (C) 2023 Free Software Foundation
4 # This program is free software: you can redistribute it and/or modify
5 # it under the terms of the GNU Affero General Public License as published
6 # by the Free Software Foundation, either version 3 of the License, or
7 # (at your option) any later version.
9 # This program is distributed in the hope that it will be useful,
10 # but WITHOUT ANY WARRANTY; without even the implied warranty of
11 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12 # GNU Affero General Public License for more details.
14 # You should have received a copy of the GNU Affero General Public License
15 # along with this program. If not, see <https://www.gnu.org/licenses/>.
20 from fba.helpers import blacklist
21 from fba.helpers import config
22 from fba.helpers import dicts as dict_helper
23 from fba.helpers import domain as domain_helper
24 from fba.helpers import tidyup
26 from fba.http import csrf
27 from fba.http import network
29 from fba.models import instances
# Module-level logging setup: requests basic root-logger configuration at
# INFO level and creates the logger, named after this module, that the
# functions below write to.
# NOTE(review): calling basicConfig() at import time is a module-level side
# effect - confirm this is intended for a module that is imported by others.
31 logging.basicConfig(level=logging.INFO)
32 logger = logging.getLogger(__name__)
34 def fetch_peers(domain: str) -> list:
# Collects peer host names for a Misskey instance by POSTing to its
# "/api/federation/instances" endpoint and appending every accepted
# row["host"] value to `peers`.
#
# Parameters:
#   domain - host name of the instance to query (annotated as str).
# Returns:
#   Annotated as list; the closing debug message reports len(peers).
# Raises:
#   Exception - when blacklist.is_blacklisted(domain) is true.
#   NOTE(review): domain_helper.raise_on() presumably raises on an invalid
#   domain - confirm against that helper.
#
# NOTE(review): the comments below describe only the statements shown here;
# `peers`, `offset` and `added` are used but their initialisation is not part
# of the visible lines - verify against the complete function.
35 logger.debug("domain='%s' - CALLED!", domain)
36 domain_helper.raise_on(domain)
# Calling this function for a blacklisted domain is treated as a caller error.
38 if blacklist.is_blacklisted(domain):
39 raise Exception(f"domain='{domain}' is blacklisted but function is invoked.")
41 logger.debug("domain='%s' is misskey, sending API POST request ...", domain)
# `step` is the amount `offset` is raised by after a full page (see below);
# it comes from the "misskey_limit" configuration value.
44 step = config.get("misskey_limit")
46 # No CSRF by default, you don't have to add network.api_headers by yourself here
# Ask the CSRF helper for the request headers, starting from an empty dict.
50 logger.debug("Checking CSRF for domain='%s'", domain)
51 headers = csrf.determine(domain, dict())
# A network-level failure during the CSRF check is logged and stored as the
# instance's last error; the debug message announces an empty-list result.
52 except network.exceptions as exception:
53 logger.warning("Exception '%s' during checking CSRF (fetch_peers,%s)", type(exception), __name__)
54 instances.set_last_error(domain, exception)
56 logger.debug("Returning empty list ... - EXIT!")
# NOTE(review): the wording about "suspended" instances below mirrors
# fetch_blocks(); whether this request filters on suspension cannot be told
# from the lines shown here.
59 # iterating through all "suspended" (follow-only in its terminology)
60 # instances page-by-page, since that software doesn't support
61 # sending them all at once
63 logger.debug("Fetching offset=%d from domain='%s' ...", offset, domain)
# Two request variants against the same endpoint.
# NOTE(review): presumably the first is used for offset == 0 and the second
# adds an "offset" entry, as fetch_blocks() does - confirm.
65 fetched = network.post_json_api(domain, "/api/federation/instances", json.dumps({
71 fetched = network.post_json_api(domain, "/api/federation/instances", json.dumps({
79 logger.debug("fetched[]='%s'", type(fetched))
# Transport-level failure reported by post_json_api(): the whole `fetched`
# value is recorded as the instance's last error.
80 if "error_message" in fetched:
81 logger.warning("post_json_api() for domain='%s' returned error message: '%s'", domain, fetched['error_message'])
82 instances.set_last_error(domain, fetched)
# API-level failure: the JSON body is a dict carrying error.message.
84 elif isinstance(fetched["json"], dict) and "error" in fetched["json"] and "message" in fetched["json"]["error"]:
# NOTE(review): this logs fetched['error']['message'], while the guard above
# and the next line read fetched["json"]["error"]["message"]; this lookup
# likely raises KeyError - confirm and align.
85 logger.warning("post_json_api() returned error: '%s'", fetched['error']['message'])
86 instances.set_last_error(domain, fetched["json"]["error"]["message"])
# The JSON body is used as the row collection (len() is taken of it below).
89 rows = fetched["json"]
91 logger.debug("rows(%d)[]='%s',step=%d", len(rows), type(rows), step)
93 logger.debug("Returned zero bytes, domain='%s' - BREAK!", domain)
# Short page: fewer rows than the configured "misskey_limit".
# NOTE(review): offset is advanced by the shortfall (limit - len(rows)), not
# by the number of rows received - confirm this is intended.
95 elif len(rows) != config.get("misskey_limit"):
96 logger.debug("Fetched %d row(s) but expected: %d", len(rows), config.get('misskey_limit'))
97 offset = offset + (config.get("misskey_limit") - len(rows))
# Full page: advance by one step.
99 logger.debug("Raising offset by step=%d", step)
100 offset = offset + step
103 logger.debug("rows(%d))[]='%s'", len(rows), type(rows))
# Per-row filtering: rows are skipped (per the log messages) when "host" is
# missing, is not a str, is already in `peers`, or is rejected by
# domain_helper.is_wanted().
105 logger.debug("row()=%d", len(row))
106 if "host" not in row:
107 logger.warning("row()=%d does not contain key 'host': row='%s',domain='%s' - SKIPPED!", len(row), row, domain)
109 elif not isinstance(row["host"], str):
110 logger.warning("row[host][]='%s' is not of type 'str' - SKIPPED!", type(row['host']))
112 elif row["host"] in peers:
113 logger.debug("Not adding row[host]='%s', already found - SKIPPED!", row['host'])
115 elif not domain_helper.is_wanted(row["host"]):
116 logger.debug("row[host]='%s' is not wanted - SKIPPED!", row["host"])
# Accepted row: remember its host name.
119 logger.debug("Adding peer: row[host]='%s'", row['host'])
121 peers.append(row["host"])
# `added` is reported per page; the next message indicates the paging stops
# when a page contributed nothing new.
123 logger.debug("added=%d,rows()=%d", added, len(rows))
125 logger.debug("Host returned already added (%d) peers - BREAK!", len(rows))
128 logger.debug("peers()=%d - EXIT!", len(peers))
131 def fetch_blocks(domain: str) -> list:
# Collects block entries for a Misskey instance from its
# "/api/federation/instances" endpoint in two passes: rows flagged
# "isSuspended" are recorded with block_level "suspended", then rows flagged
# "isBlocked" are recorded with block_level "reject".
#
# Parameters:
#   domain - host name of the instance to query (annotated as str); it is
#            logged as the "blocker" of every appended entry.
# Returns:
#   Annotated as list; the closing debug message reports len(blocklist).
# Raises:
#   Exception - when the domain is blacklisted or is not registered.
#   NOTE(review): domain_helper.raise_on() presumably raises on an invalid
#   domain - confirm against that helper.
#
# NOTE(review): the comments below describe only the statements shown here;
# `blocklist`, `offset` and `count` are used but their initialisation is not
# part of the visible lines - verify against the complete function.
132 logger.debug("domain='%s' - CALLED!", domain)
133 domain_helper.raise_on(domain)
# Both conditions are treated as caller errors.
135 if blacklist.is_blacklisted(domain):
136 raise Exception(f"domain='{domain}' is blacklisted but function is invoked.")
137 elif not instances.is_registered(domain):
138 raise Exception(f"domain='{domain}' is not registered but function is invoked.")
140 # No CSRF by default, you don't have to add network.api_headers by yourself here
# Ask the CSRF helper for the request headers, starting from an empty dict.
144 logger.debug("Checking CSRF for domain='%s' ...", domain)
145 headers = csrf.determine(domain, dict())
# A network-level failure during the CSRF check is logged and stored as the
# instance's last error; the debug message announces an empty-list result.
146 except network.exceptions as exception:
147 logger.warning("Exception '%s' during checking CSRF (fetch_blocks,%s)", type(exception), __name__)
148 instances.set_last_error(domain, exception)
150 logger.debug("Returning empty list ... - EXIT!")
# `step` is the amount `offset` is raised by after a full page; it comes from
# the "misskey_limit" configuration value.
155 step = config.get("misskey_limit")
# ---- First pass: suspended instances ----
157 # iterating through all "suspended" (follow-only in its terminology)
158 # instances page-by-page since it doesn't support sending them all at once
159 logger.debug("Fetching misskey blocks from domain='%s'", domain)
161 logger.debug("offset=%d", offset)
163 logger.debug("Fetching offset=%d from domain='%s' ...", offset, domain)
# Two request variants against the same endpoint; the second one carries an
# "offset" entry of offset - 1.
# NOTE(review): presumably the first variant is used for offset == 0 - confirm.
165 logger.debug("Sending JSON API request to domain='%s',step=%d,offset=%d", domain, step, offset)
166 fetched = network.post_json_api(domain, "/api/federation/instances", json.dumps({
173 logger.debug("Sending JSON API request to domain='%s',step=%d,offset=%d", domain, step, offset)
174 fetched = network.post_json_api(domain, "/api/federation/instances", json.dumps({
179 "offset" : offset - 1
182 logger.debug("fetched[]='%s'", type(fetched))
# Transport-level failure reported by post_json_api(): the whole `fetched`
# value is recorded as the instance's last error.
183 if "error_message" in fetched:
184 logger.warning("post_json_api() for domain='%s' returned error message: '%s'", domain, fetched['error_message'])
185 instances.set_last_error(domain, fetched)
# API-level failure: the JSON body is a dict carrying error.message.
187 elif isinstance(fetched["json"], dict) and "error" in fetched["json"] and "message" in fetched["json"]["error"]:
# NOTE(review): this logs fetched['error']['message'], while the guard above
# and the next line read fetched["json"]["error"]["message"]; this lookup
# likely raises KeyError - confirm and align.
188 logger.warning("post_json_api() returned error: '%s'", fetched['error']['message'])
189 instances.set_last_error(domain, fetched["json"]["error"]["message"])
# The JSON body is used as the row collection (len() is taken of it below).
192 rows = fetched["json"]
194 logger.debug("rows(%d)[]='%s'", len(rows), type(rows))
196 logger.debug("Returned zero bytes, domain='%s' - BREAK!", domain)
# Short page: fewer rows than the configured "misskey_limit".
# NOTE(review): offset is advanced by the shortfall (limit - len(rows)), not
# by the number of rows received - confirm this is intended.
198 elif len(rows) != config.get("misskey_limit"):
199 logger.debug("Fetched %d row(s) but expected: %d", len(rows), config.get('misskey_limit'))
200 offset = offset + (config.get("misskey_limit") - len(rows))
# Full page: advance by one step.
202 logger.debug("Raising offset by step=%d", step)
203 offset = offset + step
206 logger.debug("Checking %d row(s) of instances ...", len(rows))
207 for instance in rows:
209 logger.debug("instance[]='%s'", type(instance))
# Rows without a usable "host" value are skipped (per the log messages).
210 if "host" not in instance:
211 logger.warning("instance(%d)='%s' has no key 'host' - SKIPPED!", len(instance), instance)
213 elif instance["host"] in [None, ""]:
214 logger.debug("instance[host]='%s' is None or empty - SKIPPED!", instance["host"])
# Normalise the host name through tidyup.domain() before any further checks.
217 logger.debug("instance[host]='%s' - BEFORE!", instance["host"])
218 blocked = tidyup.domain(instance["host"])
219 logger.debug("blocked[%s]='%s' - AFTER!", type(blocked), blocked)
221 if blocked in [None, ""]:
222 logger.warning("instance[host]='%s' is None or empty after tidyup.domain() - SKIPPED!", instance["host"])
224 elif not domain_helper.is_wanted(blocked):
225 logger.debug("blocked='%s' is not wanted - SKIPPED!", blocked)
# Record only rows flagged as suspended.
# NOTE(review): dict_helper.has_key(blocklist, "blocked", blocked) presumably
# checks whether an entry for this host already exists - confirm.
227 elif "isSuspended" in instance and instance["isSuspended"] and not dict_helper.has_key(blocklist, "blocked", blocked):
229 logger.debug("Appending blocker='%s',blocked='%s',block_level='suspended'", domain, blocked)
234 "block_level": "suspended",
# `count` is reported per page; the next message indicates the loop is left
# once the API stops returning new instances.
237 logger.debug("count=%d", count)
239 logger.debug("API is no more returning new instances, aborting loop! domain='%s'", domain)
# Network failures in this pass are logged and stored as the instance's
# last error.
242 except network.exceptions as exception:
243 logger.warning("Caught error, exiting loop: domain='%s',exception[%s]='%s'", domain, type(exception), str(exception))
244 instances.set_last_error(domain, exception)
# ---- Second pass: blocked instances ----
249 # Fetch blocked (full suspended) instances
250 logger.debug("offset=%d", offset)
# Same two request variants as in the first pass; the second one carries an
# "offset" entry of offset - 1.
253 logger.debug("Sending JSON API request to domain='%s',step=%d,offset=%d", domain, step, offset)
254 fetched = network.post_json_api(domain, "/api/federation/instances", json.dumps({
261 logger.debug("Sending JSON API request to domain='%s',step=%d,offset=%d", domain, step, offset)
262 fetched = network.post_json_api(domain, "/api/federation/instances", json.dumps({
267 "offset" : offset - 1
270 logger.debug("fetched[]='%s'", type(fetched))
# Transport-level failure reported by post_json_api().
271 if "error_message" in fetched:
272 logger.warning("post_json_api() for domain='%s' returned error message: '%s'", domain, fetched['error_message'])
273 instances.set_last_error(domain, fetched)
# API-level failure: the JSON body is a dict carrying error.message.
275 elif isinstance(fetched["json"], dict) and "error" in fetched["json"] and "message" in fetched["json"]["error"]:
# NOTE(review): same mismatch as in the first pass - the log call reads
# fetched['error']['message'] instead of fetched["json"]["error"]["message"].
276 logger.warning("post_json_api() returned error: '%s'", fetched['error']['message'])
277 instances.set_last_error(domain, fetched["json"]["error"]["message"])
280 rows = fetched["json"]
282 logger.debug("rows(%d)[]='%s'", len(rows), type(rows))
284 logger.debug("Returned zero bytes, domain='%s' - BREAK!", domain)
# Short page handling, identical to the first pass.
# NOTE(review): the format string below ends with a stray apostrophe
# ("expected: %d'") that the first pass's message does not have.
286 elif len(rows) != config.get("misskey_limit"):
287 logger.debug("Fetched %d row(s) but expected: %d'", len(rows), config.get('misskey_limit'))
288 offset = offset + (config.get("misskey_limit") - len(rows))
290 logger.debug("Raising offset by step=%d", step)
291 offset = offset + step
294 logger.debug("Checking %d row(s) of instances ...", len(rows))
295 for instance in rows:
297 logger.debug("instance[]='%s'", type(instance))
# NOTE(review): unlike the first pass, instance["host"] is read here without
# first checking that the key exists or that the value is not None/empty -
# confirm whether the same guards are needed.
298 blocked = tidyup.domain(instance["host"])
299 logger.debug("blocked='%s'", blocked)
301 if blocked in [None, ""]:
302 logger.warning("instance[host]='%s' is None or empty after tidyup.domain() - SKIPPED!", instance["host"])
304 elif not domain_helper.is_wanted(blocked):
305 logger.debug("blocked='%s' is not wanted - SKIPPED!", blocked)
# Record only rows flagged as blocked that are not yet present in `blocklist`
# according to dict_helper.has_key().
307 elif "isBlocked" in instance and instance["isBlocked"] and not dict_helper.has_key(blocklist, "blocked", blocked):
309 logger.debug("Appending blocker='%s',blocked='%s',block_level='reject'", domain, blocked)
314 "block_level": "reject",
317 logger.debug("count=%d", count)
319 logger.debug("API is no more returning new instances, aborting loop!")
# Network failures in this pass are logged and stored as the instance's
# last error.
322 except network.exceptions as exception:
323 logger.warning("Caught error, exiting loop: domain='%s',exception[%s]='%s'", domain, type(exception), str(exception))
324 instances.set_last_error(domain, exception)
328 logger.debug("blocklist()=%d - EXIT!", len(blocklist))