2022-01-30 15:27:37 -08:00
|
|
|
// Copyright (c) 2021 Tulir Asokan
|
|
|
|
//
|
|
|
|
// This Source Code Form is subject to the terms of the Mozilla Public
|
|
|
|
// License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
|
|
// file, You can obtain one at http://mozilla.org/MPL/2.0/.
|
|
|
|
|
|
|
|
package whatsmeow
|
|
|
|
|
|
|
|
import (
|
|
|
|
"crypto/hmac"
|
|
|
|
"crypto/sha256"
|
|
|
|
"encoding/base64"
|
2024-05-23 14:44:31 -07:00
|
|
|
"errors"
|
2022-01-30 15:27:37 -08:00
|
|
|
"fmt"
|
|
|
|
"io"
|
2023-08-05 11:43:19 -07:00
|
|
|
"net"
|
2022-01-30 15:27:37 -08:00
|
|
|
"net/http"
|
2022-06-11 14:07:42 -07:00
|
|
|
"strings"
|
2023-08-05 11:43:19 -07:00
|
|
|
"time"
|
2022-01-30 15:27:37 -08:00
|
|
|
|
2024-05-23 14:44:31 -07:00
|
|
|
"go.mau.fi/util/retryafter"
|
2022-01-30 15:27:37 -08:00
|
|
|
"google.golang.org/protobuf/proto"
|
|
|
|
"google.golang.org/protobuf/reflect/protoreflect"
|
|
|
|
|
|
|
|
waProto "go.mau.fi/whatsmeow/binary/proto"
|
2024-08-27 10:04:05 -07:00
|
|
|
"go.mau.fi/whatsmeow/proto/waMediaTransport"
|
2022-03-12 14:02:04 -08:00
|
|
|
"go.mau.fi/whatsmeow/socket"
|
2022-01-30 15:27:37 -08:00
|
|
|
"go.mau.fi/whatsmeow/util/cbcutil"
|
|
|
|
"go.mau.fi/whatsmeow/util/hkdfutil"
|
|
|
|
)
|
|
|
|
|
|
|
|
// MediaType represents a type of uploaded file on WhatsApp.
|
|
|
|
// The value is the key which is used as a part of generating the encryption keys.
|
|
|
|
type MediaType string
|
|
|
|
|
|
|
|
// The known media types
|
|
|
|
const (
|
|
|
|
MediaImage MediaType = "WhatsApp Image Keys"
|
|
|
|
MediaVideo MediaType = "WhatsApp Video Keys"
|
|
|
|
MediaAudio MediaType = "WhatsApp Audio Keys"
|
|
|
|
MediaDocument MediaType = "WhatsApp Document Keys"
|
|
|
|
MediaHistory MediaType = "WhatsApp History Keys"
|
|
|
|
MediaAppState MediaType = "WhatsApp App State Keys"
|
2022-03-12 14:02:04 -08:00
|
|
|
|
|
|
|
MediaLinkThumbnail MediaType = "WhatsApp Link Thumbnail Keys"
|
2022-01-30 15:27:37 -08:00
|
|
|
)
|
|
|
|
|
|
|
|
// DownloadableMessage represents a protobuf message that contains attachment info.
|
2022-03-12 14:02:04 -08:00
|
|
|
//
|
|
|
|
// All of the downloadable messages inside a Message struct implement this interface
|
|
|
|
// (ImageMessage, VideoMessage, AudioMessage, DocumentMessage, StickerMessage).
|
2022-01-30 15:27:37 -08:00
|
|
|
type DownloadableMessage interface {
|
|
|
|
proto.Message
|
|
|
|
GetDirectPath() string
|
|
|
|
GetMediaKey() []byte
|
2024-08-27 10:04:05 -07:00
|
|
|
GetFileSHA256() []byte
|
|
|
|
GetFileEncSHA256() []byte
|
2022-01-30 15:27:37 -08:00
|
|
|
}
|
|
|
|
|
2022-03-12 14:02:04 -08:00
|
|
|
// DownloadableThumbnail represents a protobuf message that contains a thumbnail attachment.
|
|
|
|
//
|
|
|
|
// This is primarily meant for link preview thumbnails in ExtendedTextMessage.
|
|
|
|
type DownloadableThumbnail interface {
|
|
|
|
proto.Message
|
|
|
|
GetThumbnailDirectPath() string
|
2024-08-27 10:04:05 -07:00
|
|
|
GetThumbnailSHA256() []byte
|
|
|
|
GetThumbnailEncSHA256() []byte
|
2022-03-12 14:02:04 -08:00
|
|
|
GetMediaKey() []byte
|
|
|
|
}
|
|
|
|
|
2022-01-30 15:27:37 -08:00
|
|
|
// All the message types that are intended to be downloadable
|
|
|
|
var (
|
2022-03-12 14:02:04 -08:00
|
|
|
_ DownloadableMessage = (*waProto.ImageMessage)(nil)
|
|
|
|
_ DownloadableMessage = (*waProto.AudioMessage)(nil)
|
|
|
|
_ DownloadableMessage = (*waProto.VideoMessage)(nil)
|
|
|
|
_ DownloadableMessage = (*waProto.DocumentMessage)(nil)
|
|
|
|
_ DownloadableMessage = (*waProto.StickerMessage)(nil)
|
2023-01-28 13:57:53 -08:00
|
|
|
_ DownloadableMessage = (*waProto.StickerMetadata)(nil)
|
2022-03-12 14:02:04 -08:00
|
|
|
_ DownloadableMessage = (*waProto.HistorySyncNotification)(nil)
|
|
|
|
_ DownloadableMessage = (*waProto.ExternalBlobReference)(nil)
|
|
|
|
_ DownloadableThumbnail = (*waProto.ExtendedTextMessage)(nil)
|
2022-01-30 15:27:37 -08:00
|
|
|
)
|
|
|
|
|
|
|
|
type downloadableMessageWithLength interface {
|
|
|
|
DownloadableMessage
|
|
|
|
GetFileLength() uint64
|
|
|
|
}
|
|
|
|
|
|
|
|
type downloadableMessageWithSizeBytes interface {
|
|
|
|
DownloadableMessage
|
|
|
|
GetFileSizeBytes() uint64
|
|
|
|
}
|
|
|
|
|
|
|
|
type downloadableMessageWithURL interface {
|
|
|
|
DownloadableMessage
|
|
|
|
GetUrl() string
|
|
|
|
}
|
|
|
|
|
|
|
|
var classToMediaType = map[protoreflect.Name]MediaType{
|
|
|
|
"ImageMessage": MediaImage,
|
|
|
|
"AudioMessage": MediaAudio,
|
|
|
|
"VideoMessage": MediaVideo,
|
|
|
|
"DocumentMessage": MediaDocument,
|
|
|
|
"StickerMessage": MediaImage,
|
2023-01-28 13:57:53 -08:00
|
|
|
"StickerMetadata": MediaImage,
|
2022-01-30 15:27:37 -08:00
|
|
|
|
|
|
|
"HistorySyncNotification": MediaHistory,
|
|
|
|
"ExternalBlobReference": MediaAppState,
|
|
|
|
}
|
|
|
|
|
2022-03-12 14:02:04 -08:00
|
|
|
var classToThumbnailMediaType = map[protoreflect.Name]MediaType{
|
|
|
|
"ExtendedTextMessage": MediaLinkThumbnail,
|
|
|
|
}
|
|
|
|
|
2022-01-30 15:27:37 -08:00
|
|
|
var mediaTypeToMMSType = map[MediaType]string{
|
|
|
|
MediaImage: "image",
|
|
|
|
MediaAudio: "audio",
|
|
|
|
MediaVideo: "video",
|
|
|
|
MediaDocument: "document",
|
|
|
|
MediaHistory: "md-msg-hist",
|
|
|
|
MediaAppState: "md-app-state",
|
2022-03-12 14:02:04 -08:00
|
|
|
|
|
|
|
MediaLinkThumbnail: "thumbnail-link",
|
2022-01-30 15:27:37 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
// DownloadAny loops through the downloadable parts of the given message and downloads the first non-nil item.
|
|
|
|
func (cli *Client) DownloadAny(msg *waProto.Message) (data []byte, err error) {
|
2022-03-12 14:02:04 -08:00
|
|
|
if msg == nil {
|
|
|
|
return nil, ErrNothingDownloadableFound
|
|
|
|
}
|
|
|
|
switch {
|
|
|
|
case msg.ImageMessage != nil:
|
|
|
|
return cli.Download(msg.ImageMessage)
|
|
|
|
case msg.VideoMessage != nil:
|
|
|
|
return cli.Download(msg.VideoMessage)
|
|
|
|
case msg.AudioMessage != nil:
|
|
|
|
return cli.Download(msg.AudioMessage)
|
|
|
|
case msg.DocumentMessage != nil:
|
|
|
|
return cli.Download(msg.DocumentMessage)
|
|
|
|
case msg.StickerMessage != nil:
|
|
|
|
return cli.Download(msg.StickerMessage)
|
|
|
|
default:
|
|
|
|
return nil, ErrNothingDownloadableFound
|
2022-01-30 15:27:37 -08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func getSize(msg DownloadableMessage) int {
|
|
|
|
switch sized := msg.(type) {
|
|
|
|
case downloadableMessageWithLength:
|
|
|
|
return int(sized.GetFileLength())
|
|
|
|
case downloadableMessageWithSizeBytes:
|
|
|
|
return int(sized.GetFileSizeBytes())
|
|
|
|
default:
|
|
|
|
return -1
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-03-12 14:02:04 -08:00
|
|
|
// DownloadThumbnail downloads a thumbnail from a message.
|
|
|
|
//
|
|
|
|
// This is primarily intended for downloading link preview thumbnails, which are in ExtendedTextMessage:
|
2022-11-26 15:42:16 -08:00
|
|
|
//
|
|
|
|
// var msg *waProto.Message
|
|
|
|
// ...
|
|
|
|
// thumbnailImageBytes, err := cli.DownloadThumbnail(msg.GetExtendedTextMessage())
|
2022-03-12 14:02:04 -08:00
|
|
|
func (cli *Client) DownloadThumbnail(msg DownloadableThumbnail) ([]byte, error) {
|
|
|
|
mediaType, ok := classToThumbnailMediaType[msg.ProtoReflect().Descriptor().Name()]
|
|
|
|
if !ok {
|
|
|
|
return nil, fmt.Errorf("%w '%s'", ErrUnknownMediaType, string(msg.ProtoReflect().Descriptor().Name()))
|
|
|
|
} else if len(msg.GetThumbnailDirectPath()) > 0 {
|
2024-08-27 10:04:05 -07:00
|
|
|
return cli.DownloadMediaWithPath(msg.GetThumbnailDirectPath(), msg.GetThumbnailEncSHA256(), msg.GetThumbnailSHA256(), msg.GetMediaKey(), -1, mediaType, mediaTypeToMMSType[mediaType])
|
2022-03-12 14:02:04 -08:00
|
|
|
} else {
|
|
|
|
return nil, ErrNoURLPresent
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// GetMediaType returns the MediaType value corresponding to the given protobuf message.
|
|
|
|
func GetMediaType(msg DownloadableMessage) MediaType {
|
|
|
|
return classToMediaType[msg.ProtoReflect().Descriptor().Name()]
|
|
|
|
}
|
|
|
|
|
2022-01-30 15:27:37 -08:00
|
|
|
// Download downloads the attachment from the given protobuf message.
|
2022-03-12 14:02:04 -08:00
|
|
|
//
|
|
|
|
// The attachment is a specific part of a Message protobuf struct, not the message itself, e.g.
|
2022-11-26 15:42:16 -08:00
|
|
|
//
|
|
|
|
// var msg *waProto.Message
|
|
|
|
// ...
|
|
|
|
// imageData, err := cli.Download(msg.GetImageMessage())
|
2022-03-12 14:02:04 -08:00
|
|
|
//
|
|
|
|
// You can also use DownloadAny to download the first non-nil sub-message.
|
|
|
|
func (cli *Client) Download(msg DownloadableMessage) ([]byte, error) {
|
2022-01-30 15:27:37 -08:00
|
|
|
mediaType, ok := classToMediaType[msg.ProtoReflect().Descriptor().Name()]
|
|
|
|
if !ok {
|
|
|
|
return nil, fmt.Errorf("%w '%s'", ErrUnknownMediaType, string(msg.ProtoReflect().Descriptor().Name()))
|
|
|
|
}
|
|
|
|
urlable, ok := msg.(downloadableMessageWithURL)
|
2022-06-11 14:07:42 -07:00
|
|
|
var url string
|
|
|
|
var isWebWhatsappNetURL bool
|
|
|
|
if ok {
|
|
|
|
url = urlable.GetUrl()
|
2023-03-09 13:48:00 -08:00
|
|
|
isWebWhatsappNetURL = strings.HasPrefix(url, "https://web.whatsapp.net")
|
2022-06-11 14:07:42 -07:00
|
|
|
}
|
|
|
|
if len(url) > 0 && !isWebWhatsappNetURL {
|
2024-08-27 10:04:05 -07:00
|
|
|
return cli.downloadAndDecrypt(url, msg.GetMediaKey(), mediaType, getSize(msg), msg.GetFileEncSHA256(), msg.GetFileSHA256())
|
2022-01-30 15:27:37 -08:00
|
|
|
} else if len(msg.GetDirectPath()) > 0 {
|
2024-08-27 10:04:05 -07:00
|
|
|
return cli.DownloadMediaWithPath(msg.GetDirectPath(), msg.GetFileEncSHA256(), msg.GetFileSHA256(), msg.GetMediaKey(), getSize(msg), mediaType, mediaTypeToMMSType[mediaType])
|
2022-01-30 15:27:37 -08:00
|
|
|
} else {
|
2022-06-11 14:07:42 -07:00
|
|
|
if isWebWhatsappNetURL {
|
|
|
|
cli.Log.Warnf("Got a media message with a web.whatsapp.net URL (%s) and no direct path", url)
|
|
|
|
}
|
2022-01-30 15:27:37 -08:00
|
|
|
return nil, ErrNoURLPresent
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-05-23 14:44:31 -07:00
|
|
|
func (cli *Client) DownloadFB(transport *waMediaTransport.WAMediaTransport_Integral, mediaType MediaType) ([]byte, error) {
|
|
|
|
return cli.DownloadMediaWithPath(transport.GetDirectPath(), transport.GetFileEncSHA256(), transport.GetFileSHA256(), transport.GetMediaKey(), -1, mediaType, mediaTypeToMMSType[mediaType])
|
|
|
|
}
|
|
|
|
|
2022-03-12 14:02:04 -08:00
|
|
|
// DownloadMediaWithPath downloads an attachment by manually specifying the path and encryption details.
|
|
|
|
func (cli *Client) DownloadMediaWithPath(directPath string, encFileHash, fileHash, mediaKey []byte, fileLength int, mediaType MediaType, mmsType string) (data []byte, err error) {
|
2022-03-31 15:23:19 -07:00
|
|
|
var mediaConn *MediaConn
|
|
|
|
mediaConn, err = cli.refreshMediaConn(false)
|
2022-01-30 15:27:37 -08:00
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("failed to refresh media connections: %w", err)
|
|
|
|
}
|
2022-03-12 14:02:04 -08:00
|
|
|
if len(mmsType) == 0 {
|
|
|
|
mmsType = mediaTypeToMMSType[mediaType]
|
|
|
|
}
|
2022-03-31 15:23:19 -07:00
|
|
|
for i, host := range mediaConn.Hosts {
|
2024-05-23 14:44:31 -07:00
|
|
|
// TODO omit hash for unencrypted media?
|
2022-01-30 15:27:37 -08:00
|
|
|
mediaURL := fmt.Sprintf("https://%s%s&hash=%s&mms-type=%s&__wa-mms=", host.Hostname, directPath, base64.URLEncoding.EncodeToString(encFileHash), mmsType)
|
2022-03-12 14:02:04 -08:00
|
|
|
data, err = cli.downloadAndDecrypt(mediaURL, mediaKey, mediaType, fileLength, encFileHash, fileHash)
|
2024-08-27 10:04:05 -07:00
|
|
|
if err == nil || errors.Is(err, ErrFileLengthMismatch) || errors.Is(err, ErrInvalidMediaSHA256) {
|
2024-05-23 14:44:31 -07:00
|
|
|
return
|
|
|
|
} else if i >= len(mediaConn.Hosts)-1 {
|
|
|
|
return nil, fmt.Errorf("failed to download media from last host: %w", err)
|
2022-01-30 15:27:37 -08:00
|
|
|
}
|
2024-05-23 14:44:31 -07:00
|
|
|
// TODO there are probably some errors that shouldn't retry
|
|
|
|
cli.Log.Warnf("Failed to download media: %s, trying with next host...", err)
|
2022-01-30 15:27:37 -08:00
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2024-08-27 10:04:05 -07:00
|
|
|
func (cli *Client) downloadAndDecrypt(url string, mediaKey []byte, appInfo MediaType, fileLength int, fileEncSHA256, fileSHA256 []byte) (data []byte, err error) {
|
2022-01-30 15:27:37 -08:00
|
|
|
iv, cipherKey, macKey, _ := getMediaKeys(mediaKey, appInfo)
|
|
|
|
var ciphertext, mac []byte
|
2024-08-27 10:04:05 -07:00
|
|
|
if ciphertext, mac, err = cli.downloadPossiblyEncryptedMediaWithRetries(url, fileEncSHA256); err != nil {
|
2022-01-30 15:27:37 -08:00
|
|
|
|
2024-08-27 10:04:05 -07:00
|
|
|
} else if mediaKey == nil && fileEncSHA256 == nil && mac == nil {
|
2024-05-23 14:44:31 -07:00
|
|
|
// Unencrypted media, just return the downloaded data
|
|
|
|
data = ciphertext
|
2022-01-30 15:27:37 -08:00
|
|
|
} else if err = validateMedia(iv, ciphertext, macKey, mac); err != nil {
|
|
|
|
|
|
|
|
} else if data, err = cbcutil.Decrypt(cipherKey, iv, ciphertext); err != nil {
|
|
|
|
err = fmt.Errorf("failed to decrypt file: %w", err)
|
|
|
|
} else if fileLength >= 0 && len(data) != fileLength {
|
|
|
|
err = fmt.Errorf("%w: expected %d, got %d", ErrFileLengthMismatch, fileLength, len(data))
|
2024-08-27 10:04:05 -07:00
|
|
|
} else if len(fileSHA256) == 32 && sha256.Sum256(data) != *(*[32]byte)(fileSHA256) {
|
2022-01-30 15:27:37 -08:00
|
|
|
err = ErrInvalidMediaSHA256
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
func getMediaKeys(mediaKey []byte, appInfo MediaType) (iv, cipherKey, macKey, refKey []byte) {
|
|
|
|
mediaKeyExpanded := hkdfutil.SHA256(mediaKey, nil, []byte(appInfo), 112)
|
|
|
|
return mediaKeyExpanded[:16], mediaKeyExpanded[16:48], mediaKeyExpanded[48:80], mediaKeyExpanded[80:]
|
|
|
|
}
|
|
|
|
|
2024-05-23 14:44:31 -07:00
|
|
|
func shouldRetryMediaDownload(err error) bool {
|
|
|
|
var netErr net.Error
|
|
|
|
var httpErr DownloadHTTPError
|
|
|
|
return errors.As(err, &netErr) ||
|
|
|
|
strings.HasPrefix(err.Error(), "stream error:") || // hacky check for http2 errors
|
|
|
|
(errors.As(err, &httpErr) && retryafter.Should(httpErr.StatusCode, true))
|
|
|
|
}
|
|
|
|
|
|
|
|
func (cli *Client) downloadPossiblyEncryptedMediaWithRetries(url string, checksum []byte) (file, mac []byte, err error) {
|
2023-08-05 11:43:19 -07:00
|
|
|
for retryNum := 0; retryNum < 5; retryNum++ {
|
2024-05-23 14:44:31 -07:00
|
|
|
if checksum == nil {
|
|
|
|
file, err = cli.downloadMedia(url)
|
|
|
|
} else {
|
|
|
|
file, mac, err = cli.downloadEncryptedMedia(url, checksum)
|
2023-08-05 11:43:19 -07:00
|
|
|
}
|
2024-05-23 14:44:31 -07:00
|
|
|
if err == nil || !shouldRetryMediaDownload(err) {
|
2023-08-05 11:43:19 -07:00
|
|
|
return
|
|
|
|
}
|
2024-05-23 14:44:31 -07:00
|
|
|
retryDuration := time.Duration(retryNum+1) * time.Second
|
|
|
|
var httpErr DownloadHTTPError
|
|
|
|
if errors.As(err, &httpErr) {
|
|
|
|
retryDuration = retryafter.Parse(httpErr.Response.Header.Get("Retry-After"), retryDuration)
|
|
|
|
}
|
|
|
|
cli.Log.Warnf("Failed to download media due to network error: %w, retrying in %s...", err, retryDuration)
|
|
|
|
time.Sleep(retryDuration)
|
2023-08-05 11:43:19 -07:00
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2024-05-23 14:44:31 -07:00
|
|
|
func (cli *Client) downloadMedia(url string) ([]byte, error) {
|
|
|
|
req, err := http.NewRequest(http.MethodGet, url, nil)
|
2022-03-12 14:02:04 -08:00
|
|
|
if err != nil {
|
2024-05-23 14:44:31 -07:00
|
|
|
return nil, fmt.Errorf("failed to prepare request: %w", err)
|
2022-03-12 14:02:04 -08:00
|
|
|
}
|
|
|
|
req.Header.Set("Origin", socket.Origin)
|
|
|
|
req.Header.Set("Referer", socket.Origin+"/")
|
2024-05-23 14:44:31 -07:00
|
|
|
if cli.MessengerConfig != nil {
|
|
|
|
req.Header.Set("User-Agent", cli.MessengerConfig.UserAgent)
|
|
|
|
}
|
|
|
|
// TODO user agent for whatsapp downloads?
|
|
|
|
resp, err := cli.http.Do(req)
|
2022-01-30 15:27:37 -08:00
|
|
|
if err != nil {
|
2024-05-23 14:44:31 -07:00
|
|
|
return nil, err
|
2022-01-30 15:27:37 -08:00
|
|
|
}
|
|
|
|
defer resp.Body.Close()
|
|
|
|
if resp.StatusCode != http.StatusOK {
|
2024-05-23 14:44:31 -07:00
|
|
|
return nil, DownloadHTTPError{Response: resp}
|
2022-01-30 15:27:37 -08:00
|
|
|
}
|
2024-05-23 14:44:31 -07:00
|
|
|
return io.ReadAll(resp.Body)
|
|
|
|
}
|
|
|
|
|
|
|
|
func (cli *Client) downloadEncryptedMedia(url string, checksum []byte) (file, mac []byte, err error) {
|
|
|
|
data, err := cli.downloadMedia(url)
|
2022-01-30 15:27:37 -08:00
|
|
|
if err != nil {
|
|
|
|
return
|
|
|
|
} else if len(data) <= 10 {
|
|
|
|
err = ErrTooShortFile
|
|
|
|
return
|
|
|
|
}
|
|
|
|
file, mac = data[:len(data)-10], data[len(data)-10:]
|
|
|
|
if len(checksum) == 32 && sha256.Sum256(data) != *(*[32]byte)(checksum) {
|
|
|
|
err = ErrInvalidMediaEncSHA256
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
func validateMedia(iv, file, macKey, mac []byte) error {
|
|
|
|
h := hmac.New(sha256.New, macKey)
|
|
|
|
h.Write(iv)
|
|
|
|
h.Write(file)
|
|
|
|
if !hmac.Equal(h.Sum(nil)[:10], mac) {
|
|
|
|
return ErrInvalidMediaHMAC
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|