2023-04-06 12:19:55 +01:00
|
|
|
// GoToSocial
|
|
|
|
// Copyright (C) GoToSocial Authors admin@gotosocial.org
|
|
|
|
// SPDX-License-Identifier: AGPL-3.0-or-later
|
|
|
|
//
|
|
|
|
// This program is free software: you can redistribute it and/or modify
|
|
|
|
// it under the terms of the GNU Affero General Public License as published by
|
|
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
|
|
// (at your option) any later version.
|
|
|
|
//
|
|
|
|
// This program is distributed in the hope that it will be useful,
|
|
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
// GNU Affero General Public License for more details.
|
|
|
|
//
|
|
|
|
// You should have received a copy of the GNU Affero General Public License
|
|
|
|
// along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
|
|
|
|
package ap
|
|
|
|
|
|
|
|
import (
|
|
|
|
"github.com/superseriousbusiness/activity/pub"
|
|
|
|
"github.com/superseriousbusiness/activity/streams"
|
2023-08-11 13:40:11 +01:00
|
|
|
"github.com/superseriousbusiness/gotosocial/internal/text"
|
2023-04-06 12:19:55 +01:00
|
|
|
)
|
|
|
|
|
2023-05-09 11:16:10 +01:00
|
|
|
/*
|
|
|
|
NORMALIZE INCOMING
|
|
|
|
The below functions should be called to normalize the content
|
|
|
|
of messages *COMING INTO* GoToSocial via the federation API,
|
|
|
|
either as the result of delivery from a remote instance to this
|
|
|
|
instance, or as a result of this instance doing an http call to
|
|
|
|
another instance to dereference something.
|
|
|
|
*/
|
|
|
|
|
|
|
|
// NormalizeIncomingActivityObject normalizes the 'object'.'content' field of the given Activity.
|
2023-04-06 12:19:55 +01:00
|
|
|
//
|
|
|
|
// The rawActivity map should the freshly deserialized json representation of the Activity.
|
|
|
|
//
|
2023-05-09 11:16:10 +01:00
|
|
|
// This function is a noop if the type passed in is anything except a Create or Update with a Statusable or Accountable as its Object.
|
|
|
|
func NormalizeIncomingActivityObject(activity pub.Activity, rawJSON map[string]interface{}) {
|
|
|
|
if typeName := activity.GetTypeName(); typeName != ActivityCreate && typeName != ActivityUpdate {
|
|
|
|
// Only interested in Create or Update right now.
|
2023-04-06 12:19:55 +01:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
withObject, ok := activity.(WithObject)
|
|
|
|
if !ok {
|
|
|
|
// Create was not a WithObject.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
createObject := withObject.GetActivityStreamsObject()
|
|
|
|
if createObject == nil {
|
|
|
|
// No object set.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
if createObject.Len() != 1 {
|
|
|
|
// Not interested in Object arrays.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// We now know length is 1 so get the first
|
2023-05-09 11:16:10 +01:00
|
|
|
// item from the iter. We need this to be
|
|
|
|
// a Statusable or Accountable if we're to continue.
|
2023-04-06 12:19:55 +01:00
|
|
|
i := createObject.At(0)
|
|
|
|
if i == nil {
|
|
|
|
// This is awkward.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
t := i.GetType()
|
|
|
|
if t == nil {
|
|
|
|
// This is also awkward.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2023-05-09 11:16:10 +01:00
|
|
|
switch t.GetTypeName() {
|
|
|
|
case ObjectArticle, ObjectDocument, ObjectImage, ObjectVideo, ObjectNote, ObjectPage, ObjectEvent, ObjectPlace, ObjectProfile:
|
|
|
|
statusable, ok := t.(Statusable)
|
|
|
|
if !ok {
|
|
|
|
// Object is not Statusable;
|
|
|
|
// we're not interested.
|
|
|
|
return
|
|
|
|
}
|
2023-04-06 12:19:55 +01:00
|
|
|
|
2023-05-09 11:16:10 +01:00
|
|
|
rawObject, ok := rawJSON["object"]
|
|
|
|
if !ok {
|
|
|
|
// No object in raw map.
|
|
|
|
return
|
|
|
|
}
|
2023-04-06 12:19:55 +01:00
|
|
|
|
2023-05-09 11:16:10 +01:00
|
|
|
rawStatusableJSON, ok := rawObject.(map[string]interface{})
|
|
|
|
if !ok {
|
|
|
|
// Object wasn't a json object.
|
|
|
|
return
|
|
|
|
}
|
2023-04-06 12:19:55 +01:00
|
|
|
|
2023-05-09 11:16:10 +01:00
|
|
|
// Normalize everything we can on the statusable.
|
|
|
|
NormalizeIncomingContent(statusable, rawStatusableJSON)
|
|
|
|
NormalizeIncomingAttachments(statusable, rawStatusableJSON)
|
|
|
|
NormalizeIncomingSummary(statusable, rawStatusableJSON)
|
|
|
|
NormalizeIncomingName(statusable, rawStatusableJSON)
|
|
|
|
case ActorApplication, ActorGroup, ActorOrganization, ActorPerson, ActorService:
|
|
|
|
accountable, ok := t.(Accountable)
|
|
|
|
if !ok {
|
|
|
|
// Object is not Accountable;
|
|
|
|
// we're not interested.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
rawObject, ok := rawJSON["object"]
|
|
|
|
if !ok {
|
|
|
|
// No object in raw map.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
rawAccountableJSON, ok := rawObject.(map[string]interface{})
|
|
|
|
if !ok {
|
|
|
|
// Object wasn't a json object.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// Normalize everything we can on the accountable.
|
|
|
|
NormalizeIncomingSummary(accountable, rawAccountableJSON)
|
|
|
|
}
|
2023-04-06 12:19:55 +01:00
|
|
|
}
|
|
|
|
|
2023-05-09 11:16:10 +01:00
|
|
|
// NormalizeIncomingContent replaces the Content of the given item
|
2023-08-11 13:40:11 +01:00
|
|
|
// with the sanitized version of the raw 'content' value from the
|
|
|
|
// raw json object map.
|
2023-04-06 12:19:55 +01:00
|
|
|
//
|
2023-04-26 16:17:22 +01:00
|
|
|
// noop if there was no content in the json object map or the
|
|
|
|
// content was not a plain string.
|
2023-05-09 11:16:10 +01:00
|
|
|
func NormalizeIncomingContent(item WithSetContent, rawJSON map[string]interface{}) {
|
2023-04-26 16:17:22 +01:00
|
|
|
rawContent, ok := rawJSON["content"]
|
2023-04-06 12:19:55 +01:00
|
|
|
if !ok {
|
2023-04-26 16:17:22 +01:00
|
|
|
// No content in rawJSON.
|
2023-04-06 12:19:55 +01:00
|
|
|
// TODO: In future we might also
|
|
|
|
// look for "contentMap" property.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2023-04-26 16:17:22 +01:00
|
|
|
content, ok := rawContent.(string)
|
2023-04-06 12:19:55 +01:00
|
|
|
if !ok {
|
|
|
|
// Not interested in content arrays.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2023-08-11 13:40:11 +01:00
|
|
|
// Content should be HTML encoded by default:
|
|
|
|
// https://www.w3.org/TR/activitystreams-vocabulary/#dfn-content
|
|
|
|
//
|
|
|
|
// TODO: sanitize differently based on mediaType.
|
|
|
|
// https://www.w3.org/TR/activitystreams-vocabulary/#dfn-mediatype
|
|
|
|
content = text.SanitizeToHTML(content)
|
|
|
|
content = text.MinifyHTML(content)
|
|
|
|
|
2023-04-26 16:17:22 +01:00
|
|
|
// Set normalized content property from the raw string;
|
|
|
|
// this replaces any existing content property on the item.
|
2023-04-06 12:19:55 +01:00
|
|
|
contentProp := streams.NewActivityStreamsContentProperty()
|
2023-04-26 16:17:22 +01:00
|
|
|
contentProp.AppendXMLSchemaString(content)
|
|
|
|
item.SetActivityStreamsContent(contentProp)
|
|
|
|
}
|
|
|
|
|
2023-05-09 11:16:10 +01:00
|
|
|
// NormalizeIncomingAttachments normalizes all attachments (if any) of the given
|
|
|
|
// item, replacing the 'name' (aka content warning) field of each attachment
|
2023-08-11 13:40:11 +01:00
|
|
|
// with the raw 'name' value from the raw json object map, and doing sanitization
|
|
|
|
// on the result.
|
2023-04-26 16:17:22 +01:00
|
|
|
//
|
|
|
|
// noop if there are no attachments; noop if attachment is not a format
|
|
|
|
// we can understand.
|
2023-05-09 11:16:10 +01:00
|
|
|
func NormalizeIncomingAttachments(item WithAttachment, rawJSON map[string]interface{}) {
|
2023-04-26 16:17:22 +01:00
|
|
|
rawAttachments, ok := rawJSON["attachment"]
|
|
|
|
if !ok {
|
|
|
|
// No attachments in rawJSON.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// Convert to slice if not already,
|
|
|
|
// so we can iterate through it.
|
|
|
|
var attachments []interface{}
|
|
|
|
if attachments, ok = rawAttachments.([]interface{}); !ok {
|
|
|
|
attachments = []interface{}{rawAttachments}
|
|
|
|
}
|
|
|
|
|
|
|
|
attachmentProperty := item.GetActivityStreamsAttachment()
|
|
|
|
if attachmentProperty == nil {
|
|
|
|
// Nothing to do here.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
if l := attachmentProperty.Len(); l == 0 || l != len(attachments) {
|
|
|
|
// Mismatch between item and
|
|
|
|
// JSON, can't normalize.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// Keep an index of where we are in the iter;
|
|
|
|
// we need this so we can modify the correct
|
|
|
|
// attachment, in case of multiples.
|
|
|
|
i := -1
|
|
|
|
|
|
|
|
for iter := attachmentProperty.Begin(); iter != attachmentProperty.End(); iter = iter.Next() {
|
|
|
|
i++
|
|
|
|
|
|
|
|
t := iter.GetType()
|
|
|
|
if t == nil {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
attachmentable, ok := t.(Attachmentable)
|
|
|
|
if !ok {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
rawAttachment, ok := attachments[i].(map[string]interface{})
|
|
|
|
if !ok {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
2023-05-09 11:16:10 +01:00
|
|
|
NormalizeIncomingName(attachmentable, rawAttachment)
|
2023-04-26 16:17:22 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2023-05-09 11:16:10 +01:00
|
|
|
// NormalizeIncomingSummary replaces the Summary of the given item
|
2023-08-11 13:40:11 +01:00
|
|
|
// with the sanitized version of the raw 'summary' value from the
|
|
|
|
// raw json object map.
|
2023-04-26 16:17:22 +01:00
|
|
|
//
|
|
|
|
// noop if there was no summary in the json object map or the
|
|
|
|
// summary was not a plain string.
|
2023-05-09 11:16:10 +01:00
|
|
|
func NormalizeIncomingSummary(item WithSetSummary, rawJSON map[string]interface{}) {
|
2023-04-26 16:17:22 +01:00
|
|
|
rawSummary, ok := rawJSON["summary"]
|
|
|
|
if !ok {
|
|
|
|
// No summary in rawJSON.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
summary, ok := rawSummary.(string)
|
|
|
|
if !ok {
|
|
|
|
// Not interested in non-string summary.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2023-08-11 13:40:11 +01:00
|
|
|
// Summary should be HTML encoded:
|
|
|
|
// https://www.w3.org/TR/activitystreams-vocabulary/#dfn-summary
|
|
|
|
summary = text.SanitizeToHTML(summary)
|
|
|
|
summary = text.MinifyHTML(summary)
|
|
|
|
|
2023-04-26 16:17:22 +01:00
|
|
|
// Set normalized summary property from the raw string; this
|
|
|
|
// will replace any existing summary property on the item.
|
|
|
|
summaryProp := streams.NewActivityStreamsSummaryProperty()
|
|
|
|
summaryProp.AppendXMLSchemaString(summary)
|
|
|
|
item.SetActivityStreamsSummary(summaryProp)
|
|
|
|
}
|
|
|
|
|
2023-05-09 11:16:10 +01:00
|
|
|
// NormalizeIncomingName replaces the Name of the given item
|
2023-04-26 16:17:22 +01:00
|
|
|
// with the raw 'name' value from the raw json object map.
|
|
|
|
//
|
|
|
|
// noop if there was no name in the json object map or the
|
|
|
|
// name was not a plain string.
|
2023-05-09 11:16:10 +01:00
|
|
|
func NormalizeIncomingName(item WithSetName, rawJSON map[string]interface{}) {
|
2023-04-26 16:17:22 +01:00
|
|
|
rawName, ok := rawJSON["name"]
|
|
|
|
if !ok {
|
|
|
|
// No name in rawJSON.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
name, ok := rawName.(string)
|
|
|
|
if !ok {
|
|
|
|
// Not interested in non-string name.
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2023-08-11 13:40:11 +01:00
|
|
|
// Name *must not* include any HTML markup:
|
|
|
|
// https://www.w3.org/TR/activitystreams-vocabulary/#dfn-name
|
|
|
|
//
|
|
|
|
// todo: We probably want to update this to allow
|
|
|
|
// *escaped* HTML markup, but for now just nuke it.
|
|
|
|
name = text.SanitizeToPlaintext(name)
|
|
|
|
|
2023-04-26 16:17:22 +01:00
|
|
|
// Set normalized name property from the raw string; this
|
|
|
|
// will replace any existing name property on the item.
|
|
|
|
nameProp := streams.NewActivityStreamsNameProperty()
|
|
|
|
nameProp.AppendXMLSchemaString(name)
|
|
|
|
item.SetActivityStreamsName(nameProp)
|
2023-04-06 12:19:55 +01:00
|
|
|
}
|