2023-11-13 14:45:10 +01:00
|
|
|
"""
|
|
|
|
|
|
|
|
FIXME
|
|
|
|
|
|
|
|
1) Check feed duplication on runtime.
|
|
|
|
When feed is valid and is not yet in the database it is
|
|
|
|
possible to send a batch which would result in duplication.
|
|
|
|
Consequently, it might result in database lock error upon
|
|
|
|
feed removal attempt
|
|
|
|
|
2024-02-10 18:53:53 +01:00
|
|
|
2) Reply to messages from new contacts (not subscribed and not in roster)
|
2023-11-13 14:45:10 +01:00
|
|
|
|
2024-02-10 18:53:53 +01:00
|
|
|
TODO
|
2023-12-04 15:41:02 +01:00
|
|
|
|
2023-12-28 15:50:23 +01:00
|
|
|
2) Machine Learning for scraping Title, Link, Summary and Timestamp;
|
2023-12-24 19:37:05 +01:00
|
|
|
Scrape element </article> (example: Liferea)
|
|
|
|
http://intertwingly.net/blog/
|
|
|
|
https://www.brandenburg.de/
|
2023-11-13 14:45:10 +01:00
|
|
|
|
2023-12-28 15:50:23 +01:00
|
|
|
3) Set MUC subject
|
2023-12-04 15:41:02 +01:00
|
|
|
Feeds whose entries are to be set as groupchat subject.
|
|
|
|
Perhaps not, as it would require checking every feed for this setting.
|
2023-12-24 19:37:05 +01:00
|
|
|
Maybe a separate bot;
|
2023-11-13 14:45:10 +01:00
|
|
|
|
2024-02-10 18:53:53 +01:00
|
|
|
5) OMEMO;
|
2023-11-13 14:45:10 +01:00
|
|
|
|
2024-02-10 18:53:53 +01:00
|
|
|
6) Logging;
|
2023-12-24 19:37:05 +01:00
|
|
|
https://docs.python.org/3/howto/logging.html
|
2023-11-13 14:45:10 +01:00
|
|
|
|
2024-01-06 23:03:08 +01:00
|
|
|
9.1) IDEA: Bot to display Title and Excerpt
|
|
|
|
(including sending a PDF version of it) of posted link
|
|
|
|
|
2024-01-09 16:53:19 +01:00
|
|
|
10) Fetch summary from URL, instead of storing summary, or
|
2023-12-04 15:41:02 +01:00
|
|
|
Store 5 upcoming summaries.
|
|
|
|
This would help making the database files smaller.
|
2023-11-15 15:02:39 +01:00
|
|
|
|
2024-01-09 16:53:19 +01:00
|
|
|
13) Tip Of The Day.
|
2023-11-22 12:47:34 +01:00
|
|
|
Did you know that you can follow your favorite Mastodon feeds by just
|
|
|
|
sending the URL address?
|
|
|
|
Supported fediverse websites are:
|
2024-01-02 12:42:41 +01:00
|
|
|
Akkoma, Firefish (Calckey), Friendica, HubZilla,
|
|
|
|
Mastodon, Misskey, Pixelfed, Pleroma, Socialhome, Soapbox.
|
2023-11-22 12:47:34 +01:00
|
|
|
|
2024-01-09 16:53:19 +01:00
|
|
|
14) Brand: News Broker, Newsman, Newsdealer, Laura Harbinger
|
2023-12-24 19:37:05 +01:00
|
|
|
|
2024-01-09 16:53:19 +01:00
|
|
|
16) Search messages of government regulated publishers, and promote other sources.
|
2023-12-24 19:37:05 +01:00
|
|
|
Dear reader, we couldn't get news from XYZ as they don't provide RSS feeds.
|
|
|
|
However, you might want to get news from (1) (2) and (3) instead!
|
2023-12-11 10:04:45 +01:00
|
|
|
|
2024-02-10 18:53:53 +01:00
|
|
|
17) The operator account will be given reports from the bot about its
|
2024-01-14 19:05:12 +01:00
|
|
|
activities every X minutes.
|
|
|
|
When a suspicious activity is detected, it will be reported immediately.
|
|
|
|
|
2023-11-13 14:45:10 +01:00
|
|
|
"""
|
2023-07-16 17:23:10 +02:00
|
|
|
|
|
|
|
# vars and their meanings:
|
|
|
|
# jid = Jabber ID (XMPP)
|
|
|
|
# res = response (HTTP)
|
|
|
|
from argparse import ArgumentParser
|
2024-01-18 21:57:49 +01:00
|
|
|
from getpass import getpass
|
|
|
|
import sys
|
2023-12-11 10:04:45 +01:00
|
|
|
import configparser
|
2023-12-28 15:50:23 +01:00
|
|
|
# import filehandler
|
|
|
|
# from slixfeed.file import get_default_confdir
|
2023-07-16 17:23:10 +02:00
|
|
|
from getpass import getpass
|
|
|
|
import logging
|
2023-12-11 10:04:45 +01:00
|
|
|
import os
|
2023-07-16 17:23:10 +02:00
|
|
|
|
2023-12-04 15:41:02 +01:00
|
|
|
# from datetime import date
|
|
|
|
# import time
|
2023-07-16 17:23:10 +02:00
|
|
|
|
2023-09-29 13:49:24 +02:00
|
|
|
# from eliot import start_action, to_file
|
2024-02-04 19:19:56 +01:00
|
|
|
# # to_file(open('slixfeed.log', 'w'))
|
|
|
|
# # with start_action(action_type='set_date()', jid=jid):
|
|
|
|
# # with start_action(action_type='message()', msg=msg):
|
2023-07-16 17:23:10 +02:00
|
|
|
|
2024-01-24 19:11:39 +01:00
|
|
|
#import slixfeed.smtp
|
|
|
|
#import slixfeed.irc
|
|
|
|
#import slixfeed.matrix
|
|
|
|
|
2024-02-04 18:08:12 +01:00
|
|
|
import slixfeed.config as config
|
2024-02-04 19:19:56 +01:00
|
|
|
from slixfeed.version import __version__
|
2023-07-16 17:23:10 +02:00
|
|
|
|
2024-03-07 07:56:11 +01:00
|
|
|
# import socks
|
|
|
|
# import socket
|
2024-01-22 13:48:00 +01:00
|
|
|
|
2024-06-02 08:35:07 +02:00
|
|
|
# XMPP account settings, obtained from config.get_values() for
# 'accounts.toml' / 'xmpp' when this module is loaded. main() looks for the
# keys 'client' and 'component' in this value to decide what to start.
# NOTE(review): presumably a plain dict parsed from TOML -- confirm against
# slixfeed.config.
account_xmpp = config.get_values('accounts.toml', 'xmpp')
|
2024-01-22 13:48:00 +01:00
|
|
|
|
2024-06-02 08:35:07 +02:00
|
|
|
# account = ConfigAccount() # TODO ~Delete~ Clear as soon as possible after it is no longer needed
|
2024-01-22 13:48:00 +01:00
|
|
|
|
2024-01-18 21:57:49 +01:00
|
|
|
def _account_fields(account):
    """Return (jid, password, hostname, port, alias) of an account section.

    'jid' and 'password' are mandatory (KeyError when missing); 'hostname',
    'port' and 'alias' are optional and default to None.
    """
    return (account['jid'], account['password'],
            account.get('hostname'), account.get('port'),
            account.get('alias'))


def main():
    """Command line entry point of Slixfeed.

    Steps, in order:

    1. Parse the command line (``--version`` and ``--help`` exit here,
       before any configuration is read or printed).
    2. Configure logging from ``-q`` / ``-d``.
    3. Report the configuration directory, user agent and HTTP proxy.
    4. Start the XMPP client and/or component for every matching section
       ('client', 'component') found in ``account_xmpp``.
    5. Exit the process with status 0.

    The options --jid, --password, --alias, --hostname and --port are
    accepted but currently unused; the code that consumed them is archived
    in the comments below.
    """
    #parser = ArgumentParser(description=Slixfeed.__doc__)
    parser = ArgumentParser(description='Slixfeed News Bot')

    # Setup the command line arguments.
    parser.add_argument('-v', '--version', help='Print version',
                        action='version', version=__version__)

    # Output verbosity options.
    parser.add_argument('-q', '--quiet', help='set logging to ERROR',
                        action='store_const', dest='loglevel',
                        const=logging.ERROR, default=logging.INFO)
    parser.add_argument('-d', '--debug', help='set logging to DEBUG',
                        action='store_const', dest='loglevel',
                        const=logging.DEBUG, default=logging.INFO)

    # JID and password options.
    parser.add_argument('-j', '--jid', help='Jabber ID', dest='jid')
    parser.add_argument('-p', '--password', help='Password of JID',
                        dest='password')
    parser.add_argument('-a', '--alias', help='Display name', dest='alias')
    parser.add_argument('-n', '--hostname', help='Hostname', dest='hostname')
    parser.add_argument('-o', '--port', help='Port number', dest='port')

    args = parser.parse_args()

    # Setup logging.
    # This must precede the first logging.info() call: emitting a record
    # through the module-level functions while the root logger has no
    # handler installs a default configuration, after which basicConfig()
    # does nothing and the -q/-d options would be silently ignored.
    logging.basicConfig(level=args.loglevel,
                        format='%(levelname)-8s %(message)s')

    # # Setup logging.
    # logging.basicConfig(level=args.loglevel,
    #                     format='%(levelname)-8s %(message)s')
    # # logging.basicConfig(format='[%(levelname)s] %(message)s')
    # logger = logging.getLogger()
    # logdbg = logger.debug
    # logerr = logger.error
    # lognfo = logger.info
    # logwrn = logger.warning

    config_dir = config.get_default_config_directory()
    logging.info('Reading configuration from %s', config_dir)
    print('Reading configuration from {}'.format(config_dir))

    network_settings = config.get_values('settings.toml', 'network')
    # Fall back to the default user agent when the setting is empty.
    print('User agent:', network_settings['user_agent'] or 'Slixfeed/0.1')
    if network_settings['http_proxy']:
        print('HTTP Proxy:', network_settings['http_proxy'])

    # values = config.get_value('accounts', 'XMPP Proxy',
    #                           ['socks5_host', 'socks5_port'])
    # if values[0] and values[1]:
    #     host = values[0]
    #     port = values[1]
    #     s = socks.socksocket()
    #     s.set_proxy(socks.SOCKS5, host, port)
    #     # socks.set_default_proxy(socks.SOCKS5, host, port)
    #     # socket.socket = socks.socksocket

    # NOTE Temporarily archived
    # NOTE Consider removal of arguments jid, password and alias

    # # Try configuration file
    # jid = account[account_mode]['jid']
    # password = account[account_mode]['password']
    # alias = account[account_mode]['alias'] if 'alias' in account[account_mode] else None
    # hostname = account[account_mode]['hostname'] if 'hostname' in account[account_mode] else None
    # port = account[account_mode]['port'] if 'port' in account[account_mode] else None

    # # Use arguments if were given
    # if args.jid:
    #     jid = args.jid
    # if args.password:
    #     password = args.password
    # if args.alias:
    #     alias = args.alias
    # if args.hostname:
    #     hostname = args.hostname
    # if args.port:
    #     port = args.port

    # # Prompt for credentials if none were given
    # if not jid:
    #     jid = input('JID: ')
    # if not password:
    #     password = getpass('Password: ')
    # if not alias:
    #     alias = (input('Alias: ')) or 'Slixfeed'

    # Try configuration file
    if 'client' in account_xmpp:
        # Imported lazily so that only the configured mode is loaded.
        from slixfeed.xmpp.client import Slixfeed
        jid, password, hostname, port, alias = _account_fields(
            account_xmpp['client'])
        Slixfeed(jid, password, hostname, port, alias)

    if 'component' in account_xmpp:
        from slixfeed.xmpp.component import SlixfeedComponent
        jid, password, hostname, port, alias = _account_fields(
            account_xmpp['component'])
        SlixfeedComponent(jid, password, hostname, port, alias).process()

    sys.exit(0)
|
|
|
|
|
2024-02-04 19:19:56 +01:00
|
|
|
# Run main() only when this file is executed as a script, not when it is
# imported as a module.
if __name__ == '__main__':
    main()
|