Improve privacy relace
This commit is contained in:
		
							parent
							
								
									6d2db24c33
								
							
						
					
					
						commit
						d378e17173
					
				
					 5 changed files with 13 additions and 17 deletions
				
			
		|  | @ -2,7 +2,6 @@ import hashlib | |||
| from datetime import datetime | ||||
| from functools import cached_property | ||||
| from typing import Any | ||||
| from urllib.parse import urlparse | ||||
| 
 | ||||
| import pydantic | ||||
| from bs4 import BeautifulSoup  # type: ignore | ||||
|  | @ -12,8 +11,8 @@ from app import activitypub as ap | |||
| from app.actor import LOCAL_ACTOR | ||||
| from app.actor import Actor | ||||
| from app.actor import RemoteActor | ||||
| from app.config import PRIVACY_REPLACE | ||||
| from app.media import proxied_media_url | ||||
| from app.utils import privacy_replace | ||||
| from app.utils.datetime import now | ||||
| from app.utils.datetime import parse_isoformat | ||||
| 
 | ||||
|  | @ -179,20 +178,7 @@ class Object: | |||
|         if self.ap_object.get("mediaType") == "text/markdown": | ||||
|             content = markdown(content, extensions=["mdx_linkify"]) | ||||
| 
 | ||||
|         if not PRIVACY_REPLACE: | ||||
|             return content | ||||
| 
 | ||||
|         soup = BeautifulSoup(content, "html5lib") | ||||
|         links = soup.find_all("a", href=True) | ||||
| 
 | ||||
|         for link in links: | ||||
|             parsed_href = urlparse(link.attrs["href"]) | ||||
|             if new_netloc := PRIVACY_REPLACE.get( | ||||
|                 parsed_href.netloc.removeprefix("www.") | ||||
|             ): | ||||
|                 link.attrs["href"] = parsed_href._replace(netloc=new_netloc).geturl() | ||||
| 
 | ||||
|         return soup.find("body").decode_contents() | ||||
|         return privacy_replace.replace_content(content) | ||||
| 
 | ||||
|     @property | ||||
|     def summary(self) -> str | None: | ||||
|  |  | |||
|  | @ -32,6 +32,7 @@ from app.config import generate_csrf_token | |||
| from app.config import session_serializer | ||||
| from app.database import AsyncSession | ||||
| from app.media import proxied_media_url | ||||
| from app.utils import privacy_replace | ||||
| from app.utils.datetime import now | ||||
| from app.utils.highlight import HIGHLIGHT_CSS | ||||
| from app.utils.highlight import highlight | ||||
|  | @ -400,3 +401,4 @@ _templates.env.filters["emojify"] = _emojify | |||
| _templates.env.filters["pluralize"] = _pluralize | ||||
| _templates.env.filters["parse_datetime"] = _parse_datetime | ||||
| _templates.env.filters["poll_item_pct"] = _poll_item_pct | ||||
| _templates.env.filters["privacy_replace_url"] = privacy_replace.replace_url | ||||
|  |  | |||
|  | @ -317,7 +317,7 @@ | |||
|     </div> | ||||
|     {% endif %} | ||||
|     <div> | ||||
|         <a href="{{ og_meta.url }}">{{ og_meta.title }}</a> | ||||
|         <a href="{{ og_meta.url | privacy_replace_url }}">{{ og_meta.title }}</a> | ||||
|         {% if og_meta.site_name %} | ||||
|             <small style="display:block;">{{ og_meta.site_name }}</small> | ||||
|         {% endif %} | ||||
|  |  | |||
|  | @ -15,6 +15,7 @@ from app.database import AsyncSession | |||
| from app.models import InboxObject | ||||
| from app.models import OutboxObject | ||||
| from app.utils.url import is_url_valid | ||||
| from app.utils.url import make_abs | ||||
| 
 | ||||
| 
 | ||||
| class OpenGraphMeta(BaseModel): | ||||
|  | @ -46,6 +47,10 @@ def _scrap_og_meta(url: str, html: str) -> OpenGraphMeta | None: | |||
|     if "title" not in raw: | ||||
|         return None | ||||
| 
 | ||||
|     for maybe_rel in {"url", "image"}: | ||||
|         if u := raw.get(maybe_rel): | ||||
|             raw[maybe_rel] = make_abs(u, url) | ||||
| 
 | ||||
|     return OpenGraphMeta.parse_obj(raw) | ||||
| 
 | ||||
| 
 | ||||
|  |  | |||
|  | @ -43,6 +43,9 @@ To do so, just add as these extra config items, this is a sample config that rew | |||
| domain = "youtube.com" | ||||
| replace_by  ="yewtu.be" | ||||
| [[privacy_replace]] | ||||
| domain = "youtu.be" | ||||
| replace_by = "yewtu.be" | ||||
| [[privacy_replace]] | ||||
| domain = "twitter.com" | ||||
| replace_by = "nitter.net" | ||||
| [[privacy_replace]] | ||||
|  |  | |||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue