From 3c6da51f845b94106d23b7b34d997df0df0009df Mon Sep 17 00:00:00 2001 From: Colin Date: Wed, 8 Mar 2023 09:19:36 +0000 Subject: [PATCH 1/9] feeds/update.py: consider https AND http as a fallback --- pkgs/feeds/default.nix | 3 +-- pkgs/feeds/update.py | 10 +++++++--- 2 files changed, 8 insertions(+), 5 deletions(-) diff --git a/pkgs/feeds/default.nix b/pkgs/feeds/default.nix index 85931b71..4dc06c8f 100644 --- a/pkgs/feeds/default.nix +++ b/pkgs/feeds/default.nix @@ -28,14 +28,13 @@ '' sources_dir=modules/data/feeds/sources name="$1" - url="https://$name" json_path="$sources_dir/$name/default.json" # the name could have slashes in it, so we want to mkdir -p that # but in a way where the least could go wrong. pushd "$sources_dir"; mkdir -p "$name"; popd - ${./update.py} "$url" "$json_path" + ${./update.py} "$name" "$json_path" cat "$json_path" ''; } diff --git a/pkgs/feeds/update.py b/pkgs/feeds/update.py index 1ac2114e..1e9c3364 100755 --- a/pkgs/feeds/update.py +++ b/pkgs/feeds/update.py @@ -13,9 +13,13 @@ logging.getLogger().setLevel(logging.DEBUG) logging.getLogger().addHandler(logging.StreamHandler(sys.stdout)) logging.getLogger(__name__).debug("logging enabled") -url = coerce_url(url, default_scheme="https") -items = search(url, total_timeout=180, request_timeout=90, max_content_length=100*1024*1024) -items = sort_urls(items) +def try_scheme(url: str, scheme: str): + url = coerce_url(url, default_scheme=scheme) + print(f"trying {url}") + items = search(url, total_timeout=180, request_timeout=90, max_content_length=100*1024*1024) + return sort_urls(items) + +items = try_scheme(url, "https") or try_scheme(url, "http") # print all results serialized = [item.serialize() for item in items] From 6eb81915143240f72eaea2ae227e23fe97eba070 Mon Sep 17 00:00:00 2001 From: Colin Date: Wed, 8 Mar 2023 09:41:27 +0000 Subject: [PATCH 2/9] feeds: subscribe to Aaron Scott / textfiles.com --- hosts/common/feeds.nix | 1 + .../sources/ascii.textfiles.com/default.json | 21 +++++++++++++++++++ 2 files changed, 22 insertions(+) create mode 100644 modules/data/feeds/sources/ascii.textfiles.com/default.json diff --git a/hosts/common/feeds.nix b/hosts/common/feeds.nix index 45c2d8b0..69e0957f 100644 --- a/hosts/common/feeds.nix +++ b/hosts/common/feeds.nix @@ -112,6 +112,7 @@ let # DEVELOPERS (fromDb "uninsane.org" // tech) + (fromDb "ascii.textfiles.com" // tech) # Jason Scott (fromDb "mg.lol" // tech) (fromDb "drewdevault.com" // tech) ## Ken Shirriff diff --git a/modules/data/feeds/sources/ascii.textfiles.com/default.json b/modules/data/feeds/sources/ascii.textfiles.com/default.json new file mode 100644 index 00000000..8f7d6ccb --- /dev/null +++ b/modules/data/feeds/sources/ascii.textfiles.com/default.json @@ -0,0 +1,21 @@ +{ + "bozo": 0, + "content_length": 362082, + "content_type": "application/rss+xml; charset=utf-8", + "description": "Jason Scott's Weblog", + "favicon": "https://ascii.textfiles.com/wp-includes/images/w-logo-blue-white-bg.png", + "favicon_data_uri": "", + "hubs": [], + "is_podcast": false, + "is_push": false, + "item_count": 20, + "last_updated": "2023-03-06T07:13:07+00:00", + "score": 14, + "self_url": "https://ascii.textfiles.com/feed", + "site_name": "ASCII by Jason Scott", + "site_url": "https://ascii.textfiles.com", + "title": "ASCII by Jason Scott", + "url": "https://ascii.textfiles.com/feed", + "velocity": 0.008, + "version": "rss20" +} \ No newline at end of file From 0ecc08b49dfa7b682eb5b32bdca5dd9c60cca1e2 Mon Sep 17 00:00:00 2001 From: Colin Date: Wed, 8 Mar 2023 22:52:08 +0000 Subject: [PATCH 3/9] feeds: subscribe to LessWrong Curated --- hosts/common/feeds.nix | 2 ++ .../feeds.libsyn.com/421877/default.json | 23 +++++++++++++++++++ 2 files changed, 25 insertions(+) create mode 100644 modules/data/feeds/sources/feeds.libsyn.com/421877/default.json diff --git a/hosts/common/feeds.nix b/hosts/common/feeds.nix index 69e0957f..c7480793 100644 --- a/hosts/common/feeds.nix +++ b/hosts/common/feeds.nix @@ -50,6 +50,8 @@ let (fromDb "lexfridman.com/podcast" // rat) ## Astral Codex Ten (fromDb "sscpodcast.libsyn.com" // rat) + ## Less Wrong Curated + (fromDb "feeds.libsyn.com/421877" // rat) ## Econ Talk (fromDb "feeds.simplecast.com/wgl4xEgL" // rat) ## Cory Doctorow -- both podcast & text entries diff --git a/modules/data/feeds/sources/feeds.libsyn.com/421877/default.json b/modules/data/feeds/sources/feeds.libsyn.com/421877/default.json new file mode 100644 index 00000000..28282c35 --- /dev/null +++ b/modules/data/feeds/sources/feeds.libsyn.com/421877/default.json @@ -0,0 +1,23 @@ +{ + "bozo": 0, + "content_length": 272569, + "content_type": "text/xml; charset=utf-8", + "description": "Audio version of the posts shared in the LessWrong Curated newsletter.", + "favicon": "", + "favicon_data_uri": "", + "hubs": [ + "https://pubsubhubbub.appspot.com/" + ], + "is_podcast": true, + "is_push": true, + "item_count": 56, + "last_updated": "2023-03-08T08:00:00+00:00", + "score": 32, + "self_url": "https://feeds.buzzsprout.com/2037297.rss", + "site_name": "", + "site_url": "", + "title": "LessWrong Curated Podcast", + "url": "https://feeds.buzzsprout.com/2037297.rss", + "velocity": 0.192, + "version": "rss20" +} \ No newline at end of file From edf21e68378cc88822ad69aebd1f6700dd4da032 Mon Sep 17 00:00:00 2001 From: Colin Date: Wed, 8 Mar 2023 23:09:24 +0000 Subject: [PATCH 4/9] feeds: subscribe to Daniel Huberman podcast --- hosts/common/feeds.nix | 2 ++ .../hubermanlab/default.json | 21 +++++++++++++++++++ 2 files changed, 23 insertions(+) create mode 100644 modules/data/feeds/sources/feeds.megaphone.fm/hubermanlab/default.json diff --git a/hosts/common/feeds.nix b/hosts/common/feeds.nix index c7480793..52e1deba 100644 --- a/hosts/common/feeds.nix +++ b/hosts/common/feeds.nix @@ -62,6 +62,8 @@ let ## Emerge: making sense of what's next -- (mkPod "https://anchor.fm/s/21bc734/podcast/rss" // pol // infrequent) (fromDb "feeds.feedburner.com/80000HoursPodcast" // rat) + ## Daniel Huberman on sleep + (fromDb "feeds.megaphone.fm/hubermanlab" // uncat) (fromDb "allinchamathjason.libsyn.com" // pol) (fromDb "acquired.libsyn.com" // tech) # The Intercept - Deconstructed; also available: diff --git a/modules/data/feeds/sources/feeds.megaphone.fm/hubermanlab/default.json b/modules/data/feeds/sources/feeds.megaphone.fm/hubermanlab/default.json new file mode 100644 index 00000000..d4f6be8b --- /dev/null +++ b/modules/data/feeds/sources/feeds.megaphone.fm/hubermanlab/default.json @@ -0,0 +1,21 @@ +{ + "bozo": 0, + "content_length": 1377252, + "content_type": "application/xml; charset=utf-8", + "description": "Andrew Huberman, Ph.D.", + "favicon": "", + "favicon_data_uri": "", + "hubs": [], + "is_podcast": true, + "is_push": false, + "item_count": 129, + "last_updated": "2023-03-06T09:00:00+00:00", + "score": 14, + "self_url": "https://feeds.megaphone.fm/hubermanlab", + "site_name": "", + "site_url": "", + "title": "Huberman Lab", + "url": "https://feeds.megaphone.fm/hubermanlab", + "velocity": 0.159, + "version": "rss20" +} \ No newline at end of file From eae8ef11c847d5f94788e2168562beb5ff6e3db4 Mon Sep 17 00:00:00 2001 From: Colin Date: Wed, 8 Mar 2023 23:35:45 +0000 Subject: [PATCH 5/9] feeds: subscribe to MAPS --- hosts/common/feeds.nix | 3 +++ .../mapspodcast.libsyn.com/default.json | 21 +++++++++++++++++++ 2 files changed, 24 insertions(+) create mode 100644 modules/data/feeds/sources/mapspodcast.libsyn.com/default.json diff --git a/hosts/common/feeds.nix b/hosts/common/feeds.nix index 52e1deba..5d16a336 100644 --- a/hosts/common/feeds.nix +++ b/hosts/common/feeds.nix @@ -57,6 +57,7 @@ let ## Cory Doctorow -- both podcast & text entries (fromDb "craphound.com" // pol) (fromDb "congressionaldish.libsyn.com" // pol) + (mkPod "https://podcasts.la.utexas.edu/this-is-democracy/feed/podcast/" // pol // weekly) ## Civboot -- https://anchor.fm/civboot (fromDb "anchor.fm/s/34c7232c/podcast/rss" // tech) ## Emerge: making sense of what's next -- @@ -64,6 +65,8 @@ let (fromDb "feeds.feedburner.com/80000HoursPodcast" // rat) ## Daniel Huberman on sleep (fromDb "feeds.megaphone.fm/hubermanlab" // uncat) + ## Multidisciplinary Association for Psychedelic Studies + (fromDb "mapspodcast.libsyn.com" // uncat) (fromDb "allinchamathjason.libsyn.com" // pol) (fromDb "acquired.libsyn.com" // tech) # The Intercept - Deconstructed; also available: diff --git a/modules/data/feeds/sources/mapspodcast.libsyn.com/default.json b/modules/data/feeds/sources/mapspodcast.libsyn.com/default.json new file mode 100644 index 00000000..41139bd3 --- /dev/null +++ b/modules/data/feeds/sources/mapspodcast.libsyn.com/default.json @@ -0,0 +1,21 @@ +{ + "bozo": 0, + "content_length": 256360, + "content_type": "application/rss+xml; charset=utf-8", + "description": "Hosted by Zach Leary, the intent of the podcast is to bring you the listener an easily accessible resource for a variety of topics all related to psychedelic research. There is a lot to learn about new research into the therapeutic potential of psychedelics and marijuana. Over the years, the Multidisciplinary Association for Psychedelic Studies (MAPS) has amassed an incredible treasure trove of audio archives sourced from the amazing talks, presentations and panels that have taken place at past Psychedelic Science conferences and other unique events. By selecting some of that content and then bringing it to you in a podcast we hope to create a centralized location for the greater MAPS community. If you're a researcher, scientist, medical professional or just a curiosity seeker we hope that you'll find this content a valuable resource tool.\n\nPlease visit the MAPS website at https://maps.org", + "favicon": "", + "favicon_data_uri": "", + "hubs": [], + "is_podcast": true, + "is_push": false, + "item_count": 62, + "last_updated": "2023-03-06T20:20:00+00:00", + "score": 0, + "self_url": "https://feeds.libsyn.com/95610/rss", + "site_name": "", + "site_url": "", + "title": "MAPS Podcast", + "url": "https://feeds.libsyn.com/95610/rss", + "velocity": 0.028, + "version": "rss20" +} \ No newline at end of file From 6fe29529b21f56c70ffb2132b9ea879326301c78 Mon Sep 17 00:00:00 2001 From: Colin Date: Wed, 8 Mar 2023 23:36:16 +0000 Subject: [PATCH 6/9] init-feeds script: handle unedited url arguments --- pkgs/feeds/default.nix | 10 +++++++++- 1 file changed, 9 insertions(+), 1 deletion(-) diff --git a/pkgs/feeds/default.nix b/pkgs/feeds/default.nix index 4dc06c8f..6aeead05 100644 --- a/pkgs/feeds/default.nix +++ b/pkgs/feeds/default.nix @@ -26,8 +26,16 @@ passthru.initFeedScript = pkgs.writeShellScript "init-feed" '' + # this is the `nix run '.#init-feed' ` script` sources_dir=modules/data/feeds/sources - name="$1" + # prettify the URL, by default + name=$( \ + echo "$1" \ + | sed 's|^https://||' \ + | sed 's|^http://||' \ + | sed 's|^www\.||' \ + | sed 's|/+$||' \ + ) json_path="$sources_dir/$name/default.json" # the name could have slashes in it, so we want to mkdir -p that From 9f5d1c01118c04eeada2bce9ed04cbca46463e47 Mon Sep 17 00:00:00 2001 From: Colin Date: Wed, 8 Mar 2023 23:45:58 +0000 Subject: [PATCH 7/9] zsh: ignore "nixos-rebuild switch" in history --- hosts/common/home/zsh/default.nix | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/hosts/common/home/zsh/default.nix b/hosts/common/home/zsh/default.nix index d63d1136..c1486b9a 100644 --- a/hosts/common/home/zsh/default.nix +++ b/hosts/common/home/zsh/default.nix @@ -74,7 +74,7 @@ in # see for an example: autoload -Uz zmv - HISTORY_IGNORE='(sane-shutdown *|sane-reboot *|rm *)' + HISTORY_IGNORE='(sane-shutdown *|sane-reboot *|rm *|nixos-rebuild.* switch)' # extra aliases # TODO: move to `shellAliases` config? From cb4ca7d26a68aa3443254f09de2caee46d812d96 Mon Sep 17 00:00:00 2001 From: Colin Date: Wed, 8 Mar 2023 23:50:34 +0000 Subject: [PATCH 8/9] feeds: document the Nonlinear Library --- hosts/common/feeds.nix | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/hosts/common/feeds.nix b/hosts/common/feeds.nix index 5d16a336..9e514577 100644 --- a/hosts/common/feeds.nix +++ b/hosts/common/feeds.nix @@ -1,3 +1,7 @@ +# candidates: +# - The Nonlinear Library (podcast): +# - has ~10 posts per day, text-to-speech; i would need better tagging before adding this + { lib, sane-data, ... }: let hourly = { freq = "hourly"; }; From e5cdcc4500c3c7b498a8a6c5594ec68663c71ba0 Mon Sep 17 00:00:00 2001 From: Colin Date: Thu, 9 Mar 2023 00:33:27 +0000 Subject: [PATCH 9/9] feeds: document Metaculus Journal --- hosts/common/feeds.nix | 2 ++ 1 file changed, 2 insertions(+) diff --git a/hosts/common/feeds.nix b/hosts/common/feeds.nix index 9e514577..32b71cd0 100644 --- a/hosts/common/feeds.nix +++ b/hosts/common/feeds.nix @@ -1,6 +1,8 @@ # candidates: # - The Nonlinear Library (podcast): # - has ~10 posts per day, text-to-speech; i would need better tagging before adding this +# - +# - dead since 2022/10 - 2023/03 { lib, sane-data, ... }: let