mirror of
				https://github.com/superseriousbusiness/gotosocial.git
				synced 2025-10-31 03:52:24 -05:00 
			
		
		
		
	* [feature] Support Actor URIs for webfinger queries It's now possible to pass an Actor URI as the resource to query for when doing a webfinger query. The code now extracts the username and domain from the URI. The URI needs to be fully qualified, including having a scheme of http or https to be recognised as such. The acct scheme is handled as we used to, including dealing with an erroneous leading @ on the username. We retain the ability to handle resources without a scheme by parsing them again with the acct scheme if the original parse failed. This can happen due to parsing ambiguities when dealing with a string like user@domain.tld:port. * [bugfix] Remove debugging changes * [chore] Make TestExtractNamestring table-driven * [chore] Unnest Trim and Split for readability
		
			
				
	
	
		
			123 lines
		
	
	
	
		
			4.1 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
			
		
		
	
	
			123 lines
		
	
	
	
		
			4.1 KiB
		
	
	
	
		
			Go
		
	
	
	
	
	
| // GoToSocial
 | |
| // Copyright (C) GoToSocial Authors admin@gotosocial.org
 | |
| // SPDX-License-Identifier: AGPL-3.0-or-later
 | |
| //
 | |
| // This program is free software: you can redistribute it and/or modify
 | |
| // it under the terms of the GNU Affero General Public License as published by
 | |
| // the Free Software Foundation, either version 3 of the License, or
 | |
| // (at your option) any later version.
 | |
| //
 | |
| // This program is distributed in the hope that it will be useful,
 | |
| // but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
| // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | |
| // GNU Affero General Public License for more details.
 | |
| //
 | |
| // You should have received a copy of the GNU Affero General Public License
 | |
| // along with this program.  If not, see <http://www.gnu.org/licenses/>.
 | |
| 
 | |
| package util
 | |
| 
 | |
| import (
 | |
| 	"fmt"
 | |
| 	"net/url"
 | |
| 	"strings"
 | |
| 
 | |
| 	"github.com/superseriousbusiness/gotosocial/internal/regexes"
 | |
| )
 | |
| 
 | |
| // ExtractNamestringParts extracts the username test_user and
 | |
| // the domain example.org from a string like @test_user@example.org.
 | |
| //
 | |
| // If nothing is matched, it will return an error.
 | |
| func ExtractNamestringParts(mention string) (username, host string, err error) {
 | |
| 	matches := regexes.MentionName.FindStringSubmatch(mention)
 | |
| 	switch len(matches) {
 | |
| 	case 2:
 | |
| 		return matches[1], "", nil
 | |
| 	case 3:
 | |
| 		return matches[1], matches[2], nil
 | |
| 	default:
 | |
| 		return "", "", fmt.Errorf("couldn't match mention %s", mention)
 | |
| 	}
 | |
| }
 | |
| 
 | |
| // ExtractWebfingerParts returns the username and domain from either an
 | |
| // account query or an actor URI.
 | |
| //
 | |
| // All implementations in the wild generate webfinger account resource
 | |
| // queries with the "acct" scheme and without a leading "@"" on the username.
 | |
| // This is also the format the "subject" in a webfinger response adheres to.
 | |
| //
 | |
| // Despite this fact, we're being permissive about a single leading @. This
 | |
| // makes a query for acct:user@domain.tld and acct:@user@domain.tld
 | |
| // equivalent. But a query for acct:@@user@domain.tld will have its username
 | |
| // returned with the @ prefix.
 | |
| //
 | |
| // We also permit a resource of user@domain.tld or @user@domain.tld, without
 | |
| // a scheme. In that case it gets interpreted as if it was using the "acct"
 | |
| // scheme.
 | |
| //
 | |
| // When parsing fails, an error is returned.
 | |
| func ExtractWebfingerParts(webfinger string) (username, host string, err error) {
 | |
| 	orig := webfinger
 | |
| 
 | |
| 	u, oerr := url.ParseRequestURI(webfinger)
 | |
| 	if oerr != nil {
 | |
| 		// Most likely reason for failing to parse is if the "acct" scheme was
 | |
| 		// missing but a :port was included. So try an extra time with the scheme.
 | |
| 		u, err = url.ParseRequestURI("acct:" + webfinger)
 | |
| 		if err != nil {
 | |
| 			return "", "", fmt.Errorf("failed to parse %s with acct sheme: %w", orig, oerr)
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| 	if u.Scheme == "http" || u.Scheme == "https" {
 | |
| 		return ExtractWebfingerPartsFromURI(u)
 | |
| 	}
 | |
| 
 | |
| 	if u.Scheme != "acct" {
 | |
| 		return "", "", fmt.Errorf("unsupported scheme: %s for resource: %s", u.Scheme, orig)
 | |
| 	}
 | |
| 
 | |
| 	stripped := strings.TrimPrefix(u.Opaque, "@")
 | |
| 	userDomain := strings.Split(stripped, "@")
 | |
| 	if len(userDomain) != 2 {
 | |
| 		return "", "", fmt.Errorf("failed to extract user and domain from: %s", orig)
 | |
| 	}
 | |
| 	return userDomain[0], userDomain[1], nil
 | |
| }
 | |
| 
 | |
| // ExtractWebfingerPartsFromURI returns the user and domain extracted from
 | |
| // the passed in URI. The URI should be an actor URI.
 | |
| //
 | |
| // The domain returned is the hostname, and the user will be extracted
 | |
| // from either /@test_user or /users/test_user. These two paths match the
 | |
| // "aliasses" we include in our webfinger response and are also present in
 | |
| // our "links".
 | |
| //
 | |
| // Like with ExtractWebfingerParts, we're being permissive about a single
 | |
| // leading @.
 | |
| //
 | |
| // Errors are returned in case we end up with an empty domain or username.
 | |
| func ExtractWebfingerPartsFromURI(uri *url.URL) (username, host string, err error) {
 | |
| 	host = uri.Host
 | |
| 	if host == "" {
 | |
| 		return "", "", fmt.Errorf("failed to extract domain from: %s", uri)
 | |
| 	}
 | |
| 
 | |
| 	// strip any leading slashes
 | |
| 	path := strings.TrimLeft(uri.Path, "/")
 | |
| 	segs := strings.Split(path, "/")
 | |
| 	if segs[0] == "users" {
 | |
| 		username = segs[1]
 | |
| 	} else {
 | |
| 		username = segs[0]
 | |
| 	}
 | |
| 
 | |
| 	username = strings.TrimPrefix(username, "@")
 | |
| 	if username == "" {
 | |
| 		return "", "", fmt.Errorf("failed to extract username from: %s", uri)
 | |
| 	}
 | |
| 
 | |
| 	return
 | |
| }
 |