From 9bbd659bf5bb083a1e2bd0005d944ef40c490b04 Mon Sep 17 00:00:00 2001 From: Lynne Date: Fri, 11 Jan 2019 22:58:17 +1000 Subject: [PATCH] main.py now uses functions.py's extract_toot func --- main.py | 32 ++------------------------------ 1 file changed, 2 insertions(+), 30 deletions(-) diff --git a/main.py b/main.py index e4c0662..c56388c 100755 --- a/main.py +++ b/main.py @@ -9,6 +9,7 @@ from os import path from bs4 import BeautifulSoup import os, sqlite3, signal, sys, json, re import requests +import functions scopes = ["read:statuses", "read:accounts", "read:follows", "write:statuses", "read:notifications"] cfg = json.load(open('config.json', 'r')) @@ -56,36 +57,7 @@ if "secret" not in cfg: json.dump(cfg, open("config.json", "w+")) def extract_toot(toot): - toot = toot.replace("&apos;", "'") - toot = toot.replace("&quot;", '"') - soup = BeautifulSoup(toot, "html.parser") - - # this is the code that removes all mentions - for mention in soup.select("span.h-card"): - mention.a.unwrap() - mention.span.unwrap() - - # replace
<br> with linebreak - for lb in soup.select("br"): - lb.insert_after("\n") - lb.decompose() - - # replace <p> with linebreak - for p in soup.select("p"): - p.insert_after("\n") - p.unwrap() - - # fix hashtags - for ht in soup.select("a.hashtag"): - ht.unwrap() - - # fix links - for link in soup.select("a"): - link.insert_after(link["href"]) - link.decompose() - - toot = soup.get_text() - toot = toot.rstrip("\n") #remove trailing newline + toot = functions.extract_toot(toot) toot = toot.replace("@", "@\u200B") #put a zws between @ and username to avoid mentioning return(toot)