# HG changeset patch
# User Henry S Thompson
# Date 1702376913 0
# Node ID f593eacb57b07ab59c231b41f2c5a44ba6851aeb
# Parent  38d8baf64ac5f66ddbafc8157b0a7acac53d0170
needed now

diff -r 38d8baf64ac5 -r f593eacb57b0 mail-from-inf.el
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/mail-from-inf.el	Tue Dec 12 10:28:33 2023 +0000
@@ -0,0 +1,303 @@
+;; Basic Gnus/nnmail settings: organization, directories and mail source.
+(setq my-mail-dir "/disk/scratch/mail"
+      gnus-your-organization "HCRC, University of Edinburgh"
+      gnus-default-directory "/afs/inf.ed.ac.uk/user/h/ht"
+      nnmail-message-id-cache-file "/disk/scratch/gnus/.nnmail-cache"
+      mail-sources
+      '((file :path "/disk/scratch/mail/ht_mbox"))
+      mail-source-crash-box "/tmp/crashbox" ; local disk
+      nndraft-directory "/disk/scratch/drafts/"
+      message-auto-save-directory "/disk/scratch/drafts/"
+)
+
+;; NOTE(review): not referenced in this file; presumably read by
+;; `white-spam', which is defined elsewhere -- confirm.
+(setq white-subjects "\\b\\(phd\\|ilcc\\)\\b")
+
+;; The rule lists below are spliced into `ht-compiled-split' by
+;; `set-ht-compiled-split', so re-run that command after editing them.
+
+;; W3C lists: tried first inside the W3C branch.
+(setq w3c-lists1
+      '((list "w3c-xml-schema-\\([a-zA-Z]+\\)\\(\\.w3\\.org\\)?" "xml-schema-\\1")
+        (list "chairs\\(\\.w3\\.org\\)?" "w3c-chairs" )
+        (to "\\(w3c\\|public\\|member\\)-xml-\\([-a-zA-Z]+\\)\\(\\.w3\\.org\\)?"
+            "xml-\\2" )
+        ;(list "w3t-\\([-a-zA-Z]+\\)\\(\\.w3\\.org\\)?" "w3t-\\1")
+        ;(list "team-\\([-a-zA-Z]+\\)\\(\\.w3\\.org\\)?" "w3-team-\\1")
+        ;(list "w3c-\\(xsl-wg\\|format\\|i18n-ig\\)\\(\\.w3\\.org\\)?" "w3c-xsl")
+        (list "w3c-\\([-a-zA-Z]+\\)\\(\\.w3\\.org\\)?" "w3c-\\1")
+        (list "member-\\(ac-uk\\|access\\)" "w3-member-\\1");[-a-zA-Z]+\\)
+        (to "public-xpointer-registry\\(-request\\)?"
+            "xpointer-registry");[-a-zA-Z]+
+        (to "public-\\([-a-zA-Z]+\\)" "w3-public-\\1")
+        (to "w3c-xml-schema-\\([a-zA-Z]+\\)" "xml-schema-\\1")
+        (to "chairs" "w3c-chairs")
+        (to "w3c-xml-\\([-a-zA-Z]+\\)" "xml-\\1" )
+        (to "www-xml-\\([-a-zA-Z]+\\)" "xml-\\1")
+        ;(list "www-\\([-a-zA-Z]+\\)" "www-\\1")
+        ;(to "w3c-\\(xsl-wg\\|format\\|i18n-ig\\)" "w3c-xsl")
+        ;(to "w3t-\\([-a-zA-Z]+\\)" "w3t-\\1")
+        ;(to "team-\\([-a-zA-Z]+\\)" "w3-team-\\1")
+        ;(to "w3c-\\([-a-zA-Z]+\\)" "w3c-\\1")
+        ;(to "xml-\\([-a-zA-Z]+\\)" "w3c-\\1")
+        ;(to "member-\\([-a-zA-Z]+\\)" "w3-member-\\1")
+        ;(to "ercim-\\([-a-zA-Z]+\\)" "ercim-\\1")
+        ;(to "w3t" "w3t")
+        ))
+
+;; W3C archive lists: tried after the personal rule in the W3C branch.
+(setq w3c-lists2
+      '((to "w3t-archive" "w3t-archive")
+        (to "w3c-archive" "w3c-archive")))
+
+;; Rules for the "x.*@.*" branches: tried before the personal rule.
+(setq xml-lists1
+      '(;(to "xml-uri" "nsuri")
+        (to ".*editor.*" "xml-rec-comments")
+        (to "xml-dev" "xml")
+        (to "xsl-list" "xsl")
+        ;(to "[Xx]emacs[- ]beta" "xemacs")
+        (to "xmlschema-dev" "schema-dev")
+        (to "xproc-dev" "xproc-dev")
+        ;(to "xml-sig" "xml-python")
+        ;(to "xml-plenary" "xml-plenary")
+        ))
+
+;; Rules for the "x.*@.*" branches: tried after the personal rule.
+(setq xml-lists2
+      '((list "ietf-xml-mime\\.imc\\.org" "xml-mime")
+        (list "xml-mime\\.ietf\\.org" "xml-mime")))
+
+;; General rules, spliced in ahead of the personal rule.
+(setq misc-list1
+      '(;(from "w3t-\\([a-zA-Z]+\\)-request" "w3t-\\1")
+        ;(from "w3c-\\([a-zA-Z]+\\)-request" "w3c-\\1")
+        ;(from "xml-\\([a-zA-Z]+\\)-request" "xml-\\1")
+        ;(from "p.woolman" "nhs-xml")
+        (from "Cron Daemon" "cron")
+        (from ".*@mail.gumtree.com" "personal")
+        (from ".*@postman.storyworth.com" "storyworth")
+        ;(from "\\(Richard\\.Kirkham\\|rachel\\.johnson\\|maria\\.papadaki\\|marisol\\.leonen\\|sangeeta\\.tewar\\|abdullah\\.alshamsi\\|.*@buid\\.ac\\.ae\\)" "buid")
+        (to "www-tag" "tag")
+        ;(to "webarch@noreply.github.com" "tag")
+        ;(to "dashboard-hackers" "beagle")
+        ;(to "pellet-users" "pellet")
+        (to "tkinter-discuss" "tkinter")
+        ;(to "sdp-students" "sdp")
+        (to "fnlp-students" "fnlp")
+        ;(from "fox@tardis\\.ed\\.ac\\.uk\\|s1505551" "fnlp")
+        ;(to "anlp-students" "anlp")
+        ;(from "nbnotifications" "anlp")
+        ;(: split-on-whole-field "Subject" "Re: MSc Project 18.*" "msc18")
+        ;(: split-on-whole-field "Subject" ".*\\(FNLP\\|100782021\\).*" "fnlp")
+        ;(: split-on-whole-field "Subject" ".*SDP \\(MS .\\|final\\) evaluation" "sdpEval")
+        ;(: split-on-whole-field "Subject" ".*[[]SDP[]] \\(Your evaluation\\|Evaluation deadline\\).*" "sdpEval")
+        ;(: split-on-whole-field "Subject" ".*SDP.*" "sdp")
+        ;(: split-on-whole-field "Subject" ".*Welcome to ANLP, action needed.*" "anlp_github")
+        (: split-on-whole-field "Subject" ".*\\(ANLP\\|Accelerated Natural Language Processing\\).*" "anlp")
+        (from "ANLP on Piazza" "anlp")
+        ;(from "FNLP on Piazza" "fnlp")
+        (from "alopez\\|learn\\|scohen\\|eponti" "anlp")
+        (from "080202022-3SV1SEM2" "inf1-cg")
+        (from "INFR111252023-4SV1SEM1" "anlp")
+        (from "no-reply@piazza.com" "anlp")
+        (: split-on-whole-field "Subject" ".*Personal Tutor.*" "tutees22")
+        (: split-on-whole-field "Subject" ".*Course Selection.*" "tutees22")
+        ;(: split-on-whole-field "Subject" ".*Sutton Trust.*" "inf-recruit")
+        (: split-on-whole-field "Subject" "mycron .*" "cron")
+        ;(: split-on-whole-field "Subject" "INF1-Cg experiment.*" "cgx_2013")
+        (: split-on-whole-field "Subject" ".*[[]urn[]].*" "urn")
+        (from "\\(106300.457@compuserve.com\\|elizdrummondyoung@gmail.com\\|jcdavey12@btinternet.com\\|andrewdolan@btinternet.com\\|wandbamoyes@btinternet.com\\)" "albertus")
+        (to "corpus-admin" "corpora")
+        (: split-on-whole-field "Subject" ".*Albertus.*" "albertus")
+        (: split-on-whole-field "Subject" ".*\\[corpus-admin\\].*" "corpora")
+        ;(to ".*@\\(hst\\|hthompson\\|henry\\.thompson\\)\\.name" "personal")
+        (from "mikereape@.*" "mikereape")
+        (from "\\(.*@mumble\\.net\\|jar@csail\\.mit\\.edu\\)" "jar")
+        (from ".*@coulters.io" "belford")
+        (from ".*@umega.co.uk" "belford")
+        (to ".*@umega.co.uk" "belford")
+        (: split-on-whole-field "Subject" ".*belford.*" "belford")
+        ))
+
+;; Quaker lists, tried inside the "quaker.*" branch.
+(setq quaker-list
+      '((to "quaker-\\(l\\|spectrum\\)" "quaker")
+        ;(to "quaker-b" "quaker-b")
+        ;(to "QuakerBYM" "quaker-b")
+        ;(from "quaker-spectrum-approval" "quaker")
+        ))
+
+;; Rules applied to personal mail from @sms.ed.ac.uk senders.
+(setq sms-list
+      '(;(from "s1513009@.*" "ug4_18");\\|s1536017\\(s1443062\\|s1679328
+        ;(from "Y.Chen-258@.*" "msc_19")
+        ;(from "\\(s1795066\\|s1825415\\|A.M.Magalhaes\\|T.Makino\\|S.Li-93\\|M.Maggiolo\\|ashe\\|Y.Li-242\\|E.J.Martin\\|K.Lohse\\|D.Li-28\\|S.D.Martin-1\\|K.Chen-35\\|J.Norris-3\\|S.Li-80\\|Y.Liu-236\\|J.Chen-114\\|Q.Zeng-3\\|Y.Liu-244\\|P.Guo-1\\|s1582739\\|B.Lun\\|X.Li-143\\|F.Li-17\\|K.R.Lu\\|Z.Li-86\\)@.*" "tutees18")
+        (from "\\(s1895309\\|s1765180\\|s1764494\\|s1645474\\|s1953043\\|s1651774\\|s1732316\\|s1742667\\)@.*" "tutees20")
+        ))
+
+;; Keyboard macro stored under the function name `tut20'.
+(defalias 'tut20 (read-kbd-macro
+"C-x o C-s < RET C-s @ C-b C-x C-x M-w C-x b gnus SPC RET C-s \"tutees20 RET C-r \\\\) RET \\\\| C-y C-a ESC ESC : nil RET ESC C-x M-x ht- 3* set- ht SPC RET C-x C-s C-x b RET C-x o"))
+
+;;; groups only, comes _after_ split to pers-... for to: ht...
+(setq misc-list2
+      '(;(to "cogsci.general" "junk")
+        (from "anrdaemon@yandex.ru\\|gsenopu@gmail.com\\|pradeepan88@hotmail.com" "anr-doom")
+        ;(to "bp-people" "bp-people")
+        ;(to "ppelders" "ppelders")
+        ;(to "7vtw" "7vtw")
+        (to "\\(apps-review\\|uri-review\\|apps-discuss\\|discuss\\|architecture-discuss\\|appsdir\\|art\\)@[a-z.]*\\(ietf\\|iab\\).org" "ietf")
+        (to "urn@ietf.org" "urn")
+        (to "if-people" "if-people")
+        (to "maptask" "maptask")
+        ;(to "i18n-sig" "xml-python")
+        ;(to "spec-prod" "spec-prod")
+        ;(to "markup" "markup")
+        ;(to "system-notices" "w3c-sys-notes")
+        (to "[cC]ygwin" "cygwin")
+        ;(to "jde@sunsite.dk" "jde")
+        ;(to "jdee-users@lists.sourceforge.net" "jde")
+        (to "tagsoup-friends@yahoogroups.com" "tagsoup")
+        (to "screen-users@gnu.org" "screen")
+        (from "mailinglist@edinburghrc.co.uk" "erc")
+        (to "selenium-users" "selenium")
+        (to "python-list@python.org" "python")
+        ;(to "ding" "gnus")
+        ;(to "dssslist" "dsssl")
+        ;(to "TEI-L" "tei")
+        (to "\\(announcements\\|unicode\\)@.*[.]unicode[.]org" "unicode")
+        ;(to "squid-users@lists.squid-cache.org\\|squid-users@squid-cache.org"
+        ;    "squid")
+        (to "exist-open" "exist")
+        (list "ilcc-\\([a-zA-Z]+\\)" "ilcc-\\1")
+        (to "ilcc" "ilcc")
+        (to ".*lecturers@inf.ed.ac.uk" "inf-teach")
+        (to "\\(aisyllabus\\|acstaff\\)" "inf-teach")
+        (to "\\(inf\\)?\\(pg\\|msc\\|teach\\|res\\|staff\\)@inf\\(ormatics\\)?"
+            "inf-\\2" )
+        ;(to "directors-of-studies" "inf-dos")
+        (to "common-crawl@googlegroups.com" "ccrawl")
+        ;(list "inkscape-user\\|openbox\\|ffmpeg-user" "misc-list")
+        ))
+
+;; The spam folder names that the rules in `nnmail-split-fancy' can yield.
+(defconst ht-spam-res '("bfSPAM" "boSPAM" "edSPAM" "saSPAM" "slSPAM"))
+
+;; Entry point for nnmail.  Mail to the diary address is filed directly;
+;; everything else is first classified by the spam rules (the second
+;; argument of `!') and the lambda then decides the final split: a
+;; "notSPAM" result, or a non-nil `white-spam' (defined elsewhere), is
+;; re-split with `ht-compiled-split'; a spam result is returned as is.
+(setq nnmail-split-fancy
+      '(|
+        (to "ht\\+d@inf\\.ed\\.ac\\.uk" "_diary")
+        (!
+         (lambda (sres)
+           (cond
+            ((or (equal (car sres) "notSPAM")
+                 (white-spam t))
+             ;; documentation is wrong, no recursion,
+             ;; so we do it ourselves :-(
+             (message "was %s, trying further" sres)
+             (setq sres (nnmail-split-it ht-compiled-split))
+             (log-good-sender sres)
+             sres)
+            ((member (car sres) ht-spam-res)
+             sres)
+            (t ; shouldn't happen!
+             (message "Shouldn't happen in nnmail-split-fancy %s" sres)
+             sres))
+           )
+         (| (: split-on-whole-field "Subject" ".*=\\?UTF-8\\(\\?B\\?\\|.*=[A-F][0-9]=\\).*\\?=.*" "slSPAM")
+            ("X-Bogosity" "Yes.*"
+             (|
+              (From ".*@.*ed\\.ac\\.uk" "edSPAM") ; NB From not from
+              ("X-Spam-Score" "0" "boSPAM")
+              "bfSPAM"))
+            (: split-on-whole-field "X-Spam-Level" "\\*\\*\\*\\*.*"
+               "saSPAM")
+            ("X-Spam-Status" "Yes.*" "saSPAM")
+            "notSPAM"))))
+
+(defun set-ht-compiled-split ()
+  "Rebuild `ht-compiled-split' from the rule lists in this file.
+Fallback groups are named after the month current at the time of the
+call: pers-YYYY-MM for mail addressed to me, group-YYYY-MM otherwise."
+  (interactive)
+  (setq ht-compiled-split
+        (let* ((month
+                (format-time-string "%Y-%m" (current-time)))
+               (now-group (concat "group-" month))
+               (now-pers (concat "pers-" month))
+               ;; Regexp for my own addresses, shared by every personal rule.
+               (me "ht\\|henry\\|\\(h\\.?\\)?thompson?"))
+          `(|
+            (: split-on-whole-field "Subject" "testing" "junk")
+            (: ad-spam "adverts")
+;;;         ("Content-Type" content-spam "gnSPAM")
+;;;         ("Content-Transfer-Encoding" encoding-spam "gnSPAM")
+;;;         (: split-on-whole-subj 'subject-spam "gnSPAM")
+            ;; Special to people who use Yahoo
+;;;         ("X-YahooFilteredBulk" ".*" "gnSPAM")
+;;;         (from author-spam "gnSPAM")
+            ;; A subject with no letters is SPAM
+;;;         (: split-on-whole-subj "^[^a-zA-Z]+$" "gnSPAM")
+            ;; It would be cool to check the
+            ;; date and toss it if it is "old"
+            (to "\\(w3[ct]\\|www\\|team\\|member\\|public\\|ercim\\)[^ ]*@.*"
+                (| ,@w3c-lists1
+                   (to ,me ,now-pers)
+                   ,@w3c-lists2
+                   (to "x.*@.*" (| ,@xml-lists1
+                                   (to ,me ,now-pers)
+                                   ,@xml-lists2
+                                   ,now-group))))
+            (to "x.*@.*" (| ,@xml-lists1
+                            (to ,me ,now-pers)
+                            ,@xml-lists2))
+            ,@misc-list1
+            (to ,me
+                (| (from ".*@sms.ed.ac.uk" (|
+                                            ,@sms-list
+                                            ,now-pers))
+
+                   ,now-pers))
+            (to "quaker.*" (|
+                            ,@quaker-list
+                            ,now-group))
+            ,@misc-list2
+            ,now-group
+            ))))
+
+(defun quaker-sig-maybe ()
+  "Replace my signature with the contents of the .quaker-sig file.
+Only acts when the last signature separator in the buffer is followed
+by the expected \"Henry\" line; otherwise the buffer is left untouched."
+  (save-excursion
+    (goto-char (point-max))
+    ;; NOERROR, so a buffer without a separator is skipped quietly
+    ;; instead of signalling `search-failed'.
+    (when (and (search-backward "\n-- \n" nil t)
+               (looking-at "\n-- \n Henry"))
+      (forward-char 5)                  ; step over the separator itself
+      (kill-entire-line 6)
+      ;; `insert-file' is meant for interactive use; this is its Lisp form.
+      (insert-file-contents "/afs/inf.ed.ac.uk/user/h/ht/.quaker-sig"))))
+
+(defun straight-to-diary ()
+  "Run `gnus-edit-and-move-to-diary' on every unread article in _diary.
+Jumps to the group nnml+ht:_diary, selects it, processes its unread
+articles one at a time, then exits the summary."
+  (save-excursion
+    (gnus-group-jump-to-group "nnml+ht:_diary")
+    (message "s1 %s" (get-text-property (point) 'gnus-group))
+    (gnus-group-select-group)
+    (while (gnus-summary-first-unread-article)
+      ;; Drop any leftover *Shell Command Output* buffer before each article.
+      (let ((sco (get-buffer "*Shell Command Output*")))
+        (if sco
+            (kill-buffer sco)))
+      (gnus-edit-and-move-to-diary '(16 . t)))
+    (gnus-summary-exit)))