Software /
code /
prosody-modules
Changeset
4597:c858c76d0845
mod_tweet_data: New module that fetches and sends tweet data
based on tweet URLs in MUC messages.
author | JC Brand <jc@opkode.com> |
---|---|
date | Tue, 22 Jun 2021 11:41:16 +0200 |
parents | 4596:c406e4bf7ee5 |
children | 4598:09f0911c735d |
files | mod_ogp/README.markdown mod_tweet_data/README.md mod_tweet_data/mod_tweet_data.lua |
diffstat | 3 files changed, 162 insertions(+), 1 deletions(-) [+] |
line wrap: on
line diff
--- a/mod_ogp/README.markdown Sun Jun 20 13:54:23 2021 +0200 +++ b/mod_ogp/README.markdown Tue Jun 22 11:41:16 2021 +0200 @@ -6,7 +6,7 @@ If it finds any, it sends a [XEP-0422 fastening](https://xmpp.org/extensions/xep-0422.html) applied to the original message that looks like: ```xml -<message id="example" from="chatroom@muc.example.org" to="chatroom@muc.example.org"> +<message id="example" from="chatroom@muc.example.org" to="user@chat.example.org/resource"> <apply-to xmlns="urn:xmpp:fasten:0" id="origin-id-X"> <meta xmlns="http://www.w3.org/1999/xhtml" property="og:title" content="The Rock"/> <meta xmlns="http://www.w3.org/1999/xhtml" property="og:url" content="https://www.imdb.com/title/tt0117500/"/>
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/mod_tweet_data/README.md Tue Jun 22 11:41:16 2021 +0200 @@ -0,0 +1,34 @@ +# mod_tweet_data + +This module adds [Open Graph Protocol](https://ogp.me) metadata to Twitter.com tweet URLs sent inside a MUC. + +It's similar to [mod_ogp](https://modules.prosody.im/mod_ogp.html) but is adapted specifically to Twitter.com, which doesn't support the [Open Graph Protocol](https://ogp.me). + +When a user sends a tweet URL in a MUC (where the message has its `id` equal to its `origin-id`), this module calls that URL to get the tweet data. +If it finds any, it sends a [XEP-0422 fastening](https://xmpp.org/extensions/xep-0422.html) applied to the original message that looks as follows (note, I haven't used real data here): + +```xml + <message xmlns="jabber:client" to="user@chat.example.org/resource" from="chatroom@muc.example.org" type="groupchat"> + <apply-to xmlns="urn:xmpp:fasten:0" id="82dbc94c-c18a-4e51-a0d5-9fd3a7bfd267"> + <meta xmlns="http://www.w3.org/1999/xhtml" property="og:article:author" content="TwitterCritter" /> + <meta xmlns="http://www.w3.org/1999/xhtml" property="og:article:published_time" content="2021-06-22T06:44:20.000Z" /> + <meta xmlns="http://www.w3.org/1999/xhtml" property="og:description" content="I'm in ur twitterz" /> + <meta xmlns="http://www.w3.org/1999/xhtml" property="og:image" content="https://pbs.twimg.com/profile_images/984325764849045505/Ty3F93Ln_normal.jpg" /> + <meta xmlns="http://www.w3.org/1999/xhtml" property="og:title" content="TwitterCritter" /> + <meta xmlns="http://www.w3.org/1999/xhtml" property="og:type" content="tweet" /> + <meta xmlns="http://www.w3.org/1999/xhtml" property="og:url" content="https://twitter.com/TwitterCritter/status/1407227938391707648" /> + </apply-to> + <stanza-id xmlns="urn:xmpp:sid:0" by="chatroom@muc.example.org" id="90e8818d-390a-4c69-a2d8-0fd463fb3366"/> + </message> +``` + +Configuration +------------- + +You'll need to provide a Twitter APIv2 bearer token. + +```lua +Component "muc.example.org" "muc" + modules_enabled = { "tweet_data" } + twitter_apiv2_bearer_token = { "some-very-long-string" } +```
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/mod_tweet_data/mod_tweet_data.lua Tue Jun 22 11:41:16 2021 +0200 @@ -0,0 +1,127 @@ +local mod_muc = module:depends("muc") +local http = require "net.http" +local st = require "util.stanza" +local json = require "util.json" +local url_pattern = [[https://twitter.com/%S+/status/%S+]] +local xmlns_fasten = "urn:xmpp:fasten:0" +local xmlns_xhtml = "http://www.w3.org/1999/xhtml" +local twitter_apiv2_bearer_token = module:get_option_string("twitter_apiv2_bearer_token"); + +local function fetch_tweet_data(room, url, tweet_id, origin_id) + if not url then return; end + local options = { + method = "GET"; + headers = { Authorization = "Bearer "..twitter_apiv2_bearer_token; }; + }; + + http.request( + 'https://api.twitter.com/2/tweets/'..tweet_id..'?expansions=author_id&tweet.fields=created_at,text&user.fields=id,name,username,profile_image_url', + options, + function(response_body, response_code, _) + if response_code ~= 200 then + module:log("debug", "Call to %s returned code %s and body %s", url, response_code, response_body) + return; + end + + local response = json.decode(response_body); + if not response then return; end + + local tweet = response['data']; + local author = response['includes']['users'][1]; + + local to = room.jid + local from = room and room.jid or module.host + local fastening = st.message({to = to, from = from, type = 'groupchat'}):tag("apply-to", {xmlns = xmlns_fasten, id = origin_id}) + + fastening:tag( + "meta", + { + xmlns = xmlns_xhtml, + property = 'og:article:author', + content = author['username'] + } + ):up() + + fastening:tag( + "meta", + { + xmlns = xmlns_xhtml, + property = 'og:article:published_time', + content = tweet['created_at'] + } + ):up() + + fastening:tag( + "meta", + { + xmlns = xmlns_xhtml, + property = 'og:description', + content = tweet['text'] + } + ):up() + + fastening:tag( + "meta", + { + xmlns = xmlns_xhtml, + property = 'og:image', + content = author['profile_image_url'] + } + ):up() + + fastening:tag( + "meta", + { + xmlns = xmlns_xhtml, + property = 'og:title', + content = author['username'] + } + ):up() + + fastening:tag( + "meta", + { + xmlns = xmlns_xhtml, + property = 'og:type', + content = 'tweet' + } + ):up() + fastening:tag( + "meta", + { + xmlns = xmlns_xhtml, + property = 'og:url', + content = 'https://twitter.com/'..author['username']..'/status/'..tweet['id'] + } + ):up() + + mod_muc.get_room_from_jid(room.jid):broadcast_message(fastening) + module:log("debug", tostring(fastening)) + end + ) +end + +local function tweet_handler(event) + local room, stanza = event.room, st.clone(event.stanza) + local body = stanza:get_child_text("body") + + if not body then return; end + + local origin_id = stanza:find("{urn:xmpp:sid:0}origin-id@id") + if not origin_id then return; end + + for url in body:gmatch(url_pattern) do + local _, _, _, tweet_id = string.find(url, "https://twitter.com/(%S+)/status/(%S+)"); + fetch_tweet_data(room, url, tweet_id, origin_id); + end +end + +module:hook("muc-occupant-groupchat", tweet_handler) + + +module:hook("muc-message-is-historic", function (event) + local fastening = event.stanza:get_child('apply-to', xmlns_fasten) + if fastening and fastening:get_child('meta', xmlns_xhtml) then + return true + end +end);