;;;; rss.lisp -- RSS plugin (package chatikbot.plugins.rss)
  1. (in-package :cl-user)
  2. (defpackage chatikbot.plugins.rss
  3. (:use :cl :chatikbot.common :alexandria))
  4. (in-package :chatikbot.plugins.rss)
  5. (defstruct feed id url title next-fetch (period 300))
  6. (defstruct feed-item feed guid link title description published)
;; Tunables read by ADJUST-PERIOD when it recomputes a feed's polling period.
;; The two bounds clamp the result.
(defparameter *rss-min-period* 60 "Min rss refresh period in seconds")
(defparameter *rss-max-period* 1800 "Max rss refresh period in seconds")
;; Fraction of the current period that ADJUST-PERIOD uses as one adjustment step.
(defparameter *rss-change-rate* 0.1 "Refresh period adjustment rate")
  10. (defun find-rss-links (url)
  11. (handler-case
  12. (multiple-value-bind (root status headers uri) (xml-request url)
  13. (declare (ignore status headers))
  14. (loop for link in (get-by-tag root "link")
  15. when (string= "application/rss+xml" (plump:attribute link "type"))
  16. collect (list (plump:attribute link "title")
  17. (quri:render-uri
  18. (quri:merge-uris
  19. (quri:uri (plump:attribute link "href"))
  20. uri) nil))))
  21. (error (e) (log:error url e))))
  22. (defun build-feed (url)
  23. (let ((root (xml-request url)))
  24. (alexandria:when-let (rss (car (get-by-tag root "rss")))
  25. (make-feed :url url :title (child-text rss "title")))))
  26. (defun adjust-period (period new-items)
  27. "Adjust the period of feed based on whenever there were new items. With clamping"
  28. (let ((diff (round (* period *rss-change-rate*))))
  29. (min *rss-max-period*
  30. (max *rss-min-period*
  31. (- period (* diff (if (zerop new-items) -1 new-items)))))))
  32. (defun need-fetch-p (feed)
  33. (or (null (feed-next-fetch feed))
  34. (local-time:timestamp> (local-time:now) (feed-next-fetch feed))))
  35. (defun refresh-feed (feed &optional (skip-p #'not))
  36. (let* ((items (loop for item in (ignore-errors (fetch-feed-items feed))
  37. unless (funcall skip-p item)
  38. collect item))
  39. (new-period (adjust-period (feed-period feed) (length items))))
  40. (setf (feed-period feed) new-period
  41. (feed-next-fetch feed) (local-time:timestamp+ (local-time:now) new-period :sec))
  42. items))
  43. (defun %send-feeds (chat-id feeds)
  44. (bot-send-message chat-id
  45. (if (null feeds)
  46. "Пока ничего не постим"
  47. (format nil "Постим~%~{~A) ~A: ~A~^~%~}"
  48. (loop for feed in feeds
  49. for index from 1
  50. append (list index (feed-title feed) (feed-url feed)))))
  51. :disable-web-preview 1))
  52. (defun %fetch-new-items (feed)
  53. (loop for item in (refresh-feed feed #'db/rss-item-exists)
  54. do (db/rss-add-item item)
  55. collect item))
  56. (defun %get-feed (url)
  57. (when url
  58. (or (db/rss-get-feed-by-url url)
  59. (alexandria:when-let (feed (build-feed url))
  60. (log:info "Added feed" feed)
  61. (db/rss-add-feed feed)
  62. (%fetch-new-items feed)
  63. feed))))
  64. (defun fetch-feed-items (feed)
  65. (let ((plump:*tag-dispatchers* plump:*xml-tags*))
  66. (loop
  67. for item in (get-by-tag (xml-request (feed-url feed)) "item")
  68. collect (make-feed-item :feed feed
  69. :guid (or (child-text item "guid") (child-text item "link"))
  70. :link (child-text item "link")
  71. :title (clean-text (child-text item "title"))
  72. :description (clean-text (child-text item "description"))
  73. :published
  74. (ignore-errors
  75. (alexandria:when-let
  76. (pub (or (child-text item "pubDate")
  77. (child-text item "published")))
  78. (local-time:universal-to-timestamp
  79. (date-time-parser:parse-date-time pub))))))))
  80. (defun feed-tag (feed)
  81. (let* ((domain (quri:uri-domain (quri:uri (feed-url feed))))
  82. (dot (position #\. domain)))
  83. (when dot (setf domain (subseq domain 0 dot)))
  84. (format nil "#~A" (subst #\_ #\- domain))))
  85. (defun format-feed-item (item)
  86. (format nil "[~A](~A)~@[ @ ~A~]~%~A~%~@[~A~]"
  87. (feed-title (feed-item-feed item))
  88. (feed-item-link item)
  89. (alexandria:when-let (ts (feed-item-published item))
  90. (local-time:format-timestring
  91. nil ts
  92. :format '((:year 2) "-" (:month 2) "-" (:day 2)
  93. " " (:hour 2) ":" (:min 2))))
  94. (feed-item-title item)
  95. (feed-tag (feed-item-feed item))))
  96. (defun feed-next-fetch-unix (feed)
  97. (alexandria:when-let (ts (feed-next-fetch feed))
  98. (local-time:timestamp-to-unix ts)))
  99. (defun feed-item-published-unix (item)
  100. (alexandria:when-let (ts (feed-item-published item))
  101. (local-time:timestamp-to-unix ts)))
;; Database
;; Schema for the RSS plugin.  Every statement uses "if not exists", so the
;; statements can be executed again against an already initialised database.
(def-db-init
  ;; One row per known feed; url is unique.
  (db-execute "create table if not exists rss_feeds (id INTEGER PRIMARY KEY, url, title, next_fetch, period)")
  (db-execute "create unique index if not exists rss_feeds_url_idx on rss_feeds (url)")
  ;; Items already seen for each feed, looked up by (feed_id, guid).
  (db-execute "create table if not exists rss_items (id INTEGER PRIMARY KEY, feed_id REFERENCES rss_feeds, guid, link, title, published)")
  (db-execute "create index if not exists rss_items_idx on rss_items (feed_id, guid)")
  ;; Subscriptions: which chat receives which feed, indexed in both directions.
  (db-execute "create table if not exists rss_chat_feeds (chat_id, feed_id REFERENCES rss_feeds)")
  (db-execute "create index if not exists rss_chat_feeds_chat_idx on rss_chat_feeds (chat_id)")
  (db-execute "create index if not exists rss_chat_feeds_feed_idx on rss_chat_feeds (feed_id)"))
  111. (defun %db/make-feed (row)
  112. (when row
  113. (make-feed :id (nth 0 row)
  114. :url (nth 1 row)
  115. :title (nth 2 row)
  116. :next-fetch (when (nth 3 row) (local-time:unix-to-timestamp (nth 3 row)))
  117. :period (nth 4 row))))
  118. (defun db/rss-get-feed-by-url (url)
  119. (%db/make-feed (car (db-select "select id, url, title, next_fetch, period from rss_feeds where url = ?" url))))
  120. (defun db/rss-add-feed (feed)
  121. (with-slots (url title period) feed
  122. (let ((next-fetch (feed-next-fetch-unix feed)))
  123. (setf (feed-id feed) (db-execute "insert into rss_feeds (url, title, next_fetch, period) values (?, ?, ?, ?)"
  124. url title next-fetch period))
  125. feed)))
  126. (defun db/rss-update-feed (feed)
  127. (with-slots (id title period) feed
  128. (let ((next-fetch (feed-next-fetch-unix feed)))
  129. (db-execute "update rss_feeds set title = ?, next_fetch = ?, period = ? where id = ?"
  130. title next-fetch period id))))
  131. (defun db/rss-get-active-feeds ()
  132. (mapcar #'%db/make-feed
  133. (db-select "select id, url, title, next_fetch, period from rss_feeds where exists (select 1 from rss_chat_feeds where feed_id=id)")))
  134. (defun db/rss-get-chat-feeds (chat-id)
  135. (mapcar #'%db/make-feed
  136. (db-select "select id, url, title, next_fetch, period from rss_feeds where id in (select feed_id from rss_chat_feeds where chat_id = ?)" chat-id)))
  137. (defun db/rss-get-feed-chats (feed)
  138. (with-slots (id) feed
  139. (flatten (db-select "select chat_id from rss_chat_feeds where feed_id = ?" id))))
  140. (defun db/rss-set-chat-feeds (chat-id feeds)
  141. (db-transaction
  142. (db-execute "delete from rss_chat_feeds where chat_id = ?" chat-id)
  143. (dolist (feed feeds)
  144. (with-slots (id) feed
  145. (db-execute "insert into rss_chat_feeds (chat_id, feed_id) values (?, ?)" chat-id id)))))
  146. (defun db/rss-item-exists (item)
  147. (let ((feed-id (feed-id (feed-item-feed item)))
  148. (guid (feed-item-guid item)))
  149. (db-single "select id from rss_items where feed_id = ? and guid = ? limit 1"
  150. feed-id guid)))
  151. (defun db/rss-add-item (item)
  152. (let ((feed-id (feed-id (feed-item-feed item)))
  153. (published (feed-item-published-unix item)))
  154. (with-slots (guid link title) item
  155. (db-execute "insert into rss_items (feed_id, guid, link, title, published) values (?, ?, ?, ?, ?)"
  156. feed-id guid link title published))))
  157. (defun %db/make-feed-item (feed row)
  158. (when row
  159. (make-feed-item :feed feed
  160. :guid (nth 0 row)
  161. :link (nth 1 row)
  162. :title (nth 2 row)
  163. :published (when (nth 3 row) (local-time:unix-to-timestamp (nth 3 row))))))
  164. (defun db/rss-last-feed-items (feed &optional (limit 10))
  165. (with-slots (id) feed
  166. (mapcar #'(lambda (row) (%db/make-feed-item feed row))
  167. (db-select "select guid, link, title, published from rss_items where feed_id = ? order by published desc, id desc limit ?" id limit))))
  168. ;; Cron
  169. (defcron process-feeds ()
  170. (dolist (feed (remove-if-not #'need-fetch-p (db/rss-get-active-feeds)))
  171. (dolist (item (%fetch-new-items feed))
  172. (dolist (*chat-id* (db/rss-get-feed-chats feed))
  173. (bot-send-message (format-feed-item item)
  174. :parse-mode "Markdown"
  175. :disable-web-preview 1)))
  176. (db/rss-update-feed feed))) ;; Update next fetch and period
  177. ;; Hooks
  178. (def-message-cmd-handler handler-cmd-feeds (:feeds)
  179. (bot-send-message
  180. (if (null *args*)
  181. "URL давай"
  182. (format nil "~:[Не нашел RSS там~;~:*~{~{~A - ~A~}~^~%~}~]"
  183. (find-rss-links (car *args*))))
  184. :disable-web-preview 1))
  185. (def-message-cmd-handler handler-cmd-rss (:rss)
  186. (let ((feeds (db/rss-get-chat-feeds *chat-id*)))
  187. (if (null *args*)
  188. (%send-feeds *chat-id* feeds)
  189. (progn
  190. (dolist (url *args*)
  191. (handler-case
  192. (let ((idx (parse-integer url)))
  193. (when (<= idx (length feeds))
  194. (setf feeds (remove (nth (1- idx) feeds) feeds))))
  195. (parse-error ()
  196. (alexandria:when-let (feed (%get-feed
  197. (or (cadar (find-rss-links url))
  198. url)))
  199. (let ((existing (find (feed-url feed) feeds :key #'feed-url :test #'equal)))
  200. (if existing
  201. (setf feeds (remove existing feeds))
  202. (push feed feeds)))))
  203. (error (e) (log:error "~A: ~A" url e))))
  204. (db/rss-set-chat-feeds *chat-id* feeds)
  205. (%send-feeds *chat-id* (db/rss-get-chat-feeds *chat-id*))))))
  206. (def-message-cmd-handler handler-cmd-last-rss (:lastrss)
  207. (let ((feeds (db/rss-get-chat-feeds *chat-id*)))
  208. (if (null *args*)
  209. (%send-feeds *chat-id* feeds)
  210. (let* ((idx (1- (parse-integer (car *args*))))
  211. (limit (min 20 (if (> (length *args*) 1) (parse-integer (second *args*)) 5)))
  212. (items (db/rss-last-feed-items (nth idx feeds) limit)))
  213. (bot-send-message (format nil "~{~A~^~%~%~}"
  214. (mapcar #'format-feed-item items))
  215. :parse-mode "Markdown"
  216. :disable-web-preview 1)))))