|
1 | 1 | { |
2 | 2 | "title": "Public Data", |
3 | 3 | "tagline": "Open datasets generated and published by the Podcast Index project.", |
4 | | - "intro": "Podcast Index produces a number of public data exports — full feed catalogs, recommendation lists, value-block dumps, activity stats, and infrastructure pointers — all served as static files under public.podcastindex.org and a few sibling subdomains. They are free to mirror and use; please don't hammer them in tight loops, and prefer the SQLite/CSV catalog dumps over live API scraping when you need bulk data.", |
| 4 | + "intro": "Podcast Index produces a number of public data exports - full feed catalogs, recommendation lists, value-block dumps, activity stats, and infrastructure pointers - all served as static files under public.podcastindex.org and a few sibling subdomains. They are free to mirror and use; please don't hammer them in tight loops, and prefer the SQLite/CSV catalog dumps over live API scraping when you need bulk data.", |
5 | 5 | "sections": [ |
6 | 6 | { |
7 | 7 | "id": "catalog", |
8 | 8 | "name": "Catalog snapshots", |
9 | | - "description": "Full feed catalogs. The SQLite dumps are the canonical bulk artifacts — load them directly with sqlite3 or any client.", |
| 9 | + "description": "Full feed catalogs. The SQLite dumps are the canonical bulk artifacts - load them directly with sqlite3 or any client.", |
10 | 10 | "datasets": [ |
11 | 11 | { |
12 | | - "name": "All live feeds — SQLite", |
| 12 | + "name": "All live feeds - SQLite", |
13 | 13 | "url": "https://public.podcastindex.org/podcastindex_feeds.db.tgz", |
14 | 14 | "format": "tar.gz (SQLite)", |
15 | 15 | "cadence": "weekly", |
16 | | - "description": "Every feed currently being polled, with title, URL, owner, iTunes ID, host, language, categories, generator, and lastest-episode timestamps. The most heavily used artifact downstream — most third-party mirrors of the Podcast Index data start here." |
| 16 | + "description": "Every feed currently being polled, with title, URL, owner, iTunes ID, host, language, categories, generator, and latest-episode timestamps. The most heavily used artifact downstream - most third-party mirrors of the Podcast Index data start here." |
17 | 17 | }, |
18 | 18 | { |
19 | | - "name": "Dead feeds — CSV (id only)", |
| 19 | + "name": "Dead feeds - CSV (id only)", |
20 | 20 | "url": "https://public.podcastindex.org/podcastindex_dead_feeds.csv", |
21 | 21 | "format": "CSV", |
22 | 22 | "cadence": "daily", |
23 | 23 | "description": "Lightweight CSV of dead feed IDs and the ID of the feed they duplicate (if any). Use this if you only need to reconcile your own list of feeds against the dead set." |
24 | 24 | }, |
25 | 25 | { |
26 | | - "name": "Problematic feeds — CSV", |
| 26 | + "name": "Problematic feeds - CSV", |
27 | 27 | "url": "https://public.podcastindex.org/podcastindex_problematic_feeds.csv", |
28 | 28 | "format": "CSV", |
29 | 29 | "cadence": "daily", |
|
37 | 37 | "description": "Curated and computed lists derived from podcast 2.0 tags and feed metadata.", |
38 | 38 | "datasets": [ |
39 | 39 | { |
40 | | - "name": "Recommendations — all media", |
| 40 | + "name": "Recommendations - all media", |
41 | 41 | "url": "https://public.podcastindex.org/recommendations.json", |
42 | 42 | "format": "JSON", |
43 | 43 | "cadence": "daily", |
44 | 44 | "description": "Show recommendations mined from <podcast:podroll> tags across the whole index, ranked by mention count." |
45 | 45 | }, |
46 | 46 | { |
47 | | - "name": "Recommendations — video only", |
| 47 | + "name": "Recommendations - video only", |
48 | 48 | "url": "https://public.podcastindex.org/recommendations_video.json", |
49 | 49 | "format": "JSON", |
50 | 50 | "cadence": "daily", |
51 | 51 | "description": "The same recommendation graph, filtered to feeds whose <podcast:medium> or content profile marks them as video." |
52 | 52 | }, |
53 | 53 | { |
54 | | - "name": "Recommendations — music only", |
| 54 | + "name": "Recommendations - music only", |
55 | 55 | "url": "https://public.podcastindex.org/recommendations_music.json", |
56 | 56 | "format": "JSON", |
57 | 57 | "cadence": "daily", |
58 | 58 | "description": "The same recommendation graph, filtered to feeds whose <podcast:medium> or content profile marks them as music." |
59 | 59 | }, |
60 | 60 | { |
61 | | - "name": "Value-enabled feeds — CSV", |
| 61 | + "name": "Value-enabled feeds - CSV", |
62 | 62 | "url": "https://public.podcastindex.org/valueEnabledFeeds.csv", |
63 | 63 | "format": "CSV", |
64 | 64 | "cadence": "daily", |
|
79 | 79 | "description": "Time-series counts and rolling new-feed reports.", |
80 | 80 | "datasets": [ |
81 | 81 | { |
82 | | - "name": "24-hour feed report — HTML", |
| 82 | + "name": "24-hour feed report - HTML", |
83 | 83 | "url": "https://public.podcastindex.org/24hourFeedReport.html", |
84 | 84 | "format": "HTML", |
85 | 85 | "cadence": "daily", |
86 | 86 | "description": "Human-readable daily report: counts of new feeds added in the last 24 hours, top generators, hour-by-hour add rate, and keyword-based scoring of the new-arrival mix." |
87 | 87 | }, |
88 | 88 | { |
89 | | - "name": "Newly-added feeds (last 24h) — CSV", |
| 89 | + "name": "Newly-added feeds (last 24h) - CSV", |
90 | 90 | "url": "https://public.podcastindex.org/newlyAddedFeeds24hours.csv", |
91 | 91 | "format": "CSV", |
92 | 92 | "cadence": "daily", |
|
104 | 104 | "url": "https://stats.podcastindex.org/daily_counts.json", |
105 | 105 | "format": "JSON", |
106 | 106 | "cadence": "daily", |
107 | | - "description": "Day-bucketed aggregate counts with a longer retention window than the hourly file — better for long-term trend lines." |
| 107 | + "description": "Day-bucketed aggregate counts with a longer retention window than the hourly file - better for long-term trend lines." |
108 | 108 | } |
109 | 109 | ] |
110 | 110 | }, |
|
121 | 121 | "description": "Plain-text list of Hive blockchain RPC nodes that have recently passed a health check. Consumed by Podping listeners that need a working node to subscribe to." |
122 | 122 | }, |
123 | 123 | { |
124 | | - "name": "Live tracking firehose — current window", |
| 124 | + "name": "Live tracking firehose - current window", |
125 | 125 | "url": "https://tracking.podcastindex.org/current", |
126 | 126 | "format": "JSON", |
127 | 127 | "cadence": "every few minutes", |
|
0 commit comments