73e4c1cf28
This was originally authored by @stevesavanna in #707. This commit contains changes and refactors that could not be pushed to the original PR. Changes from #707 - Don't ignore bounce mails missing campaign / subscriber UUIDs. The original behaviour falls back to looking up subscribers by e-mail. - Refactor repetetive header.get + regexp conditions per header into a simpler lookup map. - Trim e-mail header values of `\r`. Closes #707, #763 Co-authored-by: stevesavanna <steven@savannacorp.com>
186 lines
4.8 KiB
Go
186 lines
4.8 KiB
Go
package mailbox
|
|
|
|
import (
|
|
"encoding/json"
|
|
"io"
|
|
"regexp"
|
|
"strings"
|
|
"time"
|
|
|
|
"github.com/emersion/go-message"
|
|
_ "github.com/emersion/go-message/charset"
|
|
"github.com/knadh/go-pop3"
|
|
"github.com/knadh/listmonk/models"
|
|
)
|
|
|
|
// POP represents a POP mailbox.
|
|
type POP struct {
|
|
opt Opt
|
|
client *pop3.Client
|
|
}
|
|
|
|
type bounceHeaders struct {
|
|
Header string
|
|
Regexp *regexp.Regexp
|
|
}
|
|
|
|
var (
|
|
// List of header to look for in the e-mail body, regexp to fall back to if the header is empty.
|
|
headerLookups = []bounceHeaders{
|
|
{models.EmailHeaderCampaignUUID, regexp.MustCompile(`(?m)(?:^` + models.EmailHeaderCampaignUUID + `:\s+?)([a-z0-9\-]{36})`)},
|
|
{models.EmailHeaderSubscriberUUID, regexp.MustCompile(`(?m)(?:^` + models.EmailHeaderSubscriberUUID + `:\s+?)([a-z0-9\-]{36})`)},
|
|
{models.EmailHeaderDate, regexp.MustCompile(`(?m)(?:^` + models.EmailHeaderDate + `:\s+?)([\w,\,\ ,:,+,-]*(?:\(?:\w*\))?)`)},
|
|
{models.EmailHeaderFrom, regexp.MustCompile(`(?m)(?:^` + models.EmailHeaderFrom + `:\s+?)(.*)`)},
|
|
{models.EmailHeaderSubject, regexp.MustCompile(`(?m)(?:^` + models.EmailHeaderSubject + `:\s+?)(.*)`)},
|
|
{models.EmailHeaderMessageId, regexp.MustCompile(`(?m)(?:^` + models.EmailHeaderMessageId + `:\s+?)(.*)`)},
|
|
{models.EmailHeaderDeliveredTo, regexp.MustCompile(`(?m)(?:^` + models.EmailHeaderDeliveredTo + `:\s+?)(.*)`)},
|
|
}
|
|
|
|
reHdrReceived = regexp.MustCompile(`(?m)(?:^` + models.EmailHeaderReceived + `:\s+?)(.*)`)
|
|
)
|
|
|
|
// NewPOP returns a new instance of the POP mailbox client.
|
|
func NewPOP(opt Opt) *POP {
|
|
return &POP{
|
|
opt: opt,
|
|
client: pop3.New(pop3.Opt{
|
|
Host: opt.Host,
|
|
Port: opt.Port,
|
|
TLSEnabled: opt.TLSEnabled,
|
|
TLSSkipVerify: opt.TLSSkipVerify,
|
|
}),
|
|
}
|
|
}
|
|
|
|
// Scan scans the mailbox and pushes the downloaded messages into the given channel.
|
|
// The messages that are downloaded are deleted from the server. If limit > 0,
|
|
// all messages on the server are downloaded and deleted.
|
|
func (p *POP) Scan(limit int, ch chan models.Bounce) error {
|
|
c, err := p.client.NewConn()
|
|
if err != nil {
|
|
return err
|
|
}
|
|
defer c.Quit()
|
|
|
|
// Authenticate.
|
|
if p.opt.AuthProtocol != "none" {
|
|
if err := c.Auth(p.opt.Username, p.opt.Password); err != nil {
|
|
return err
|
|
}
|
|
}
|
|
|
|
// Get the total number of messages on the server.
|
|
count, _, err := c.Stat()
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
// No messages.
|
|
if count == 0 {
|
|
return nil
|
|
}
|
|
|
|
if limit > 0 && count > limit {
|
|
count = limit
|
|
}
|
|
|
|
// Download messages.
|
|
for id := 1; id <= count; id++ {
|
|
// Retrieve the raw bytes of the message.
|
|
b, err := c.RetrRaw(id)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
// Parse the message.
|
|
m, err := message.Read(b)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
h := m
|
|
|
|
// If this is a multipart message, find the last part.
|
|
if mr := m.MultipartReader(); mr != nil {
|
|
for {
|
|
part, err := mr.NextPart()
|
|
if err == io.EOF {
|
|
break
|
|
} else if err != nil {
|
|
return err
|
|
}
|
|
h = part
|
|
}
|
|
}
|
|
|
|
// Reset the "unread portion" pointer of the message buffer.
|
|
// If you don't do this, you can't read the entire body because the pointer will not point to the beginning.
|
|
b, _ = c.RetrRaw(id)
|
|
|
|
// Lookup headers in the e-mail. If a header isn't found, fall back to regexp lookups.
|
|
hdr := make(map[string]string, 7)
|
|
for _, l := range headerLookups {
|
|
v := h.Header.Get(l.Header)
|
|
|
|
// Not in the header. Try regexp.
|
|
if v == "" {
|
|
if m := l.Regexp.FindAllSubmatch(b.Bytes(), -1); m != nil {
|
|
v = string(m[len(m)-1][1])
|
|
}
|
|
}
|
|
|
|
hdr[l.Header] = strings.TrimSpace(v)
|
|
}
|
|
|
|
// Received is a []string header.
|
|
msgReceived := h.Header.Map()[models.EmailHeaderReceived]
|
|
if len(msgReceived) == 0 {
|
|
if u := reHdrReceived.FindAllSubmatch(b.Bytes(), -1); u != nil {
|
|
for i := 0; i < len(u); i++ {
|
|
msgReceived = append(msgReceived, string(u[i][1]))
|
|
}
|
|
}
|
|
}
|
|
|
|
date, _ := time.Parse("Mon, 02 Jan 2006 15:04:05 -0700", hdr[models.EmailHeaderDate])
|
|
if date.IsZero() {
|
|
date = time.Now()
|
|
}
|
|
|
|
// Additional bounce e-mail metadata.
|
|
meta, _ := json.Marshal(struct {
|
|
From string `json:"from"`
|
|
Subject string `json:"subject"`
|
|
MessageID string `json:"message_id"`
|
|
DeliveredTo string `json:"delivered_to"`
|
|
Received []string `json:"received"`
|
|
}{
|
|
From: hdr[models.EmailHeaderFrom],
|
|
Subject: hdr[models.EmailHeaderSubject],
|
|
MessageID: hdr[models.EmailHeaderMessageId],
|
|
DeliveredTo: hdr[models.EmailHeaderDeliveredTo],
|
|
Received: msgReceived,
|
|
})
|
|
|
|
select {
|
|
case ch <- models.Bounce{
|
|
Type: "hard",
|
|
CampaignUUID: hdr[models.EmailHeaderCampaignUUID],
|
|
SubscriberUUID: hdr[models.EmailHeaderSubscriberUUID],
|
|
Source: p.opt.Host,
|
|
CreatedAt: date,
|
|
Meta: meta,
|
|
}:
|
|
default:
|
|
}
|
|
}
|
|
|
|
// Delete the downloaded messages.
|
|
for id := 1; id <= count; id++ {
|
|
if err := c.Dele(id); err != nil {
|
|
return err
|
|
}
|
|
}
|
|
|
|
return nil
|
|
}
|