cry/cry/cli.py
John Doty cd20db0c4c Subscribe now searches
Rewrite feed finder again to not multi-fetch when not needed
2024-07-15 17:23:24 +09:00

295 lines
8.4 KiB
Python

# https://simonwillison.net/2023/Sep/30/cli-tools-python/
import asyncio
import html
import http.server
import io
import logging
import click
from . import feed
from . import feedfinder
from . import database
from . import opml
LOG = logging.getLogger(__name__)
@click.group()
@click.version_option()
@click.option(
"-v",
"--verbose",
count=True,
help="Increase the verbosity of the output. This option can be specified multiple times.",
)
def cli(verbose):
"Command line feed reader"
if verbose > 1:
level = logging.DEBUG
elif verbose > 0:
level = logging.INFO
else:
level = logging.WARN
logging.basicConfig(level=level)
@cli.command(name="search")
@click.argument("url")
def search(url):
"Search an URL for feeds."
# TODO: Rewrite to use our new one
feeds = feedfinder.find_feeds(url)
for feed in feeds:
click.echo(feed)
click.echo(f"Found {len(feeds)} feeds")
@cli.command(name="subscribe")
@click.argument("url")
@click.option("--literal/--no-literal", "-l/-L", default=False)
def subscribe(url, literal):
"Subscribe to a feed at the specified URL."
db = database.Database.local()
if not literal:
click.echo(f"Searching for feeds for {url} ...")
feeds = asyncio.run(feed.feed_search(url, db.origin))
if len(feeds) == 0:
click.echo(f"Unable to find a suitable feed for {url}")
return 1
if len(feeds) > 1:
# If we found more than one feed then we will try to see what the
# individual feeds are.
click.echo(f"Found {len(feeds)} feeds:")
max_title = max(len(f.title) for f in feeds)
max_url = max(len(f.meta.url) for f in feeds)
feeds.sort(key=lambda f: f.title)
for f in feeds:
click.echo(f"{f.title:{max_title}} {f.meta.url:{max_url}}")
click.echo(
"\nRun `subscribe` again with the URL of the feed you want to subscribe to."
)
return 1
result = feeds[0]
click.echo(f"Identified {result.meta.url} as a feed for {url}")
else:
click.echo(f"Fetching {url} ...")
meta = feed.FeedMeta.from_url(url, db.origin)
d, meta = asyncio.run(feed.fetch_feed(meta))
if d is None:
click.echo(f"Unable to fetch {url}")
return 1
if isinstance(d, str):
click.echo(f"{url} does not seem to be a feed")
return 1
result = d
# Check to see if this URL is already in the database.
existing = db.load_feed(result.meta.url)
if existing is not None:
click.echo(f"This feed already exists (as {result.meta.url})")
return 1
db.store_feed(result)
click.echo(f"Subscribed to {result.meta.url}")
@cli.command(name="import")
@click.argument("opml_file", type=click.File("r", encoding="utf-8"))
def import_opml(opml_file):
"Import the specified OPML file."
db = database.Database.local()
urls = opml.parse_opml(opml_file.read())
metas = [feed.FeedMeta.from_url(url, db.origin) for url in urls]
click.echo(f"Fetching {len(urls)} feeds ...")
results = asyncio.run(feed.fetch_many(metas))
subscribed = 0
for index, result in enumerate(results):
d, meta = result
url = urls[index]
if d is None:
LOG.warn(f"Unable to fetch {url}, skipping...")
continue
if isinstance(d, str):
click.echo(f"{url} does not seem to be a feed, skipping...")
continue
existing = db.load_feed(meta.url)
if existing is not None:
LOG.info(f"{url} already exists (as {meta.url})")
continue
db.store_feed(d)
subscribed = subscribed + 1
click.echo(f"Subscribed to {subscribed} new feeds")
@cli.command(name="refresh")
@click.argument("url", required=False, default=None)
def refresh(url):
"""Refresh one or more feeds.
If a URL is specified, refresh that URL. Otherwise, refresh all subscribed
feeds.
"""
db = database.Database.local()
if url:
f = db.load_feed(url)
if f is None:
click.echo(f"Not subscribed to {url}")
return 1
feeds = [f.meta]
else:
feeds = db.load_all_meta()
click.echo(f"Refreshing {len(feeds)} feed(s)...")
results = asyncio.run(feed.fetch_many(feeds))
new_count = 0
for d, meta in results:
if d is None:
# Nothing new.
db.update_meta(meta)
elif isinstance(d, str):
click.echo(f"WARNING: {meta.url} returned a non-feed result!")
else:
# New items, possibly!
new_count = new_count + db.store_feed(d)
click.echo(f"Fetched {new_count} new entries.")
@cli.command(name="show")
@click.argument("pattern", required=False, default="")
@click.option(
"--count",
"-c",
type=int,
default=10,
show_default=True,
help="Show at most this many entries from each feed.",
)
def show(pattern, count):
"""Show feeds and entries.
If a pattern is supplied, then filter the feeds to urls or titles that
match the pattern. Otherwise, just show everything.
"""
db = database.Database.local()
feeds = db.load_all(feed_limit=count, pattern=pattern or "")
feeds.sort(key=feed.sort_key, reverse=True)
for f in feeds:
click.echo(f"{f.title}")
if len(f.entries) > 0:
for entry in f.entries:
click.echo(f" {entry.title}")
else:
click.echo(f" <No Entries>")
click.echo()
@cli.command("list")
@click.argument("pattern", required=False, default="")
def list_feeds(pattern):
"""List subscribed feeds.
If a pattern is supplied, then filter the feeds to urls or titles that
match the pattern. Otherwise, just show everything.
"""
db = database.Database.local()
feeds = db.load_all(feed_limit=0, pattern=pattern)
max_title = max(len(f.title) for f in feeds)
max_url = max(len(f.meta.url) for f in feeds)
feeds.sort(key=lambda f: f.title)
for f in feeds:
click.echo(f"{f.title:{max_title}} {f.meta.url:{max_url}}")
@cli.command("unsubscribe")
@click.argument("url")
def unsubscribe(url):
"""Unsubscribe from the specified feed.
(If you need to find the URL for the feed to unsubscribe from, use the
`list` command.)
"""
db = database.Database.local()
count = db.set_feed_status(url, feed.FEED_STATUS_UNSUBSCRIBED)
if count == 0:
click.echo(f"Not subscribed to feed {url}")
return 1
@cli.command("serve")
def serve():
class Handler(http.server.BaseHTTPRequestHandler):
def do_GET(self):
db = database.Database.local()
feeds = db.load_all(feed_limit=10)
del db
feeds.sort(key=feed.sort_key, reverse=True)
buffer = io.StringIO()
buffer.write(
"""
<!doctype html>
<head>
<meta charset="utf8">
<title>Subscribed Feeds</title>
</head>
<h1>Feeds</h1>
"""
)
for f in feeds:
feed_title = html.escape(f.title)
if len(f.entries) > 0:
ago = f" ({f.entries[0].time_ago()})"
else:
ago = ""
buffer.write(f'<h2><a href="{f.link}">{feed_title}</a>{ago}</h2>')
buffer.write(f"<div>")
if len(f.entries) > 0:
for entry in f.entries:
title = html.escape(entry.title)
buffer.write(
f'<span class="entry">&bull; <a href="{entry.link}">{title}</a> ({entry.time_ago()})</span> '
)
else:
buffer.write("<i>No entries...</i>")
buffer.write(f"</div>")
buffer.flush()
text = buffer.getvalue()
response = text.encode("utf-8")
self.send_response(200)
self.send_header("content-type", "text/html")
self.send_header("content-length", str(len(response)))
self.end_headers()
self.wfile.write(response)
with http.server.HTTPServer(("", 8000), Handler) as server:
click.echo("Serving at http://127.0.0.1:8000/")
server.serve_forever()