| 
									
										
										
										
											2021-07-28 11:42:26 +02:00
										 |  |  | /* | 
					
						
							|  |  |  |    GoToSocial | 
					
						
							| 
									
										
										
										
											2021-12-20 18:42:19 +01:00
										 |  |  |    Copyright (C) 2021-2022 GoToSocial Authors admin@gotosocial.org | 
					
						
							| 
									
										
										
										
											2021-07-28 11:42:26 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |    This program is free software: you can redistribute it and/or modify | 
					
						
							|  |  |  |    it under the terms of the GNU Affero General Public License as published by | 
					
						
							|  |  |  |    the Free Software Foundation, either version 3 of the License, or | 
					
						
							|  |  |  |    (at your option) any later version. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |    This program is distributed in the hope that it will be useful, | 
					
						
							|  |  |  |    but WITHOUT ANY WARRANTY; without even the implied warranty of | 
					
						
							|  |  |  |    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the | 
					
						
							|  |  |  |    GNU Affero General Public License for more details. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |    You should have received a copy of the GNU Affero General Public License | 
					
						
							|  |  |  |    along with this program.  If not, see <http://www.gnu.org/licenses/>. | 
					
						
							|  |  |  | */ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | package text | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | import ( | 
					
						
							| 
									
										
										
										
											2022-05-07 16:55:27 +01:00
										 |  |  | 	"bytes" | 
					
						
							| 
									
										
										
										
											2021-08-25 15:34:33 +02:00
										 |  |  | 	"context" | 
					
						
							| 
									
										
										
										
											2021-07-28 11:42:26 +02:00
										 |  |  | 	"net/url" | 
					
						
							| 
									
										
										
										
											2022-05-07 16:55:27 +01:00
										 |  |  | 	"strings" | 
					
						
							| 
									
										
										
										
											2021-07-28 11:42:26 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-05-07 16:55:27 +01:00
										 |  |  | 	"github.com/superseriousbusiness/gotosocial/internal/regexes" | 
					
						
							| 
									
										
										
										
											2021-07-28 11:42:26 +02:00
										 |  |  | ) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | // FindLinks parses the given string looking for recognizable URLs (including scheme). | 
					
						
							|  |  |  | // It returns a list of those URLs, without changing the string, or an error if something goes wrong. | 
					
						
							|  |  |  | // If no URLs are found within the given string, an empty slice and nil will be returned. | 
					
						
							| 
									
										
										
										
											2022-05-07 16:55:27 +01:00
										 |  |  | func FindLinks(in string) []*url.URL { | 
					
						
							|  |  |  | 	var urls []*url.URL | 
					
						
							| 
									
										
										
										
											2021-07-28 11:42:26 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  | 	// bail already if we don't find anything | 
					
						
							| 
									
										
										
										
											2022-05-07 16:55:27 +01:00
										 |  |  | 	found := regexes.LinkScheme.FindAllString(in, -1) | 
					
						
							| 
									
										
										
										
											2021-07-28 11:42:26 +02:00
										 |  |  | 	if len(found) == 0 { | 
					
						
							| 
									
										
										
										
											2022-05-07 16:55:27 +01:00
										 |  |  | 		return nil | 
					
						
							| 
									
										
										
										
											2021-07-28 11:42:26 +02:00
										 |  |  | 	} | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-05-07 16:55:27 +01:00
										 |  |  | 	urlmap := map[string]struct{}{} | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-07-28 11:42:26 +02:00
										 |  |  | 	// for each string we find, we want to parse it into a URL if we can | 
					
						
							|  |  |  | 	// if we fail to parse it, just ignore this match and continue | 
					
						
							|  |  |  | 	for _, f := range found { | 
					
						
							|  |  |  | 		u, err := url.Parse(f) | 
					
						
							|  |  |  | 		if err != nil { | 
					
						
							|  |  |  | 			continue | 
					
						
							|  |  |  | 		} | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-05-07 16:55:27 +01:00
										 |  |  | 		// Calculate string | 
					
						
							|  |  |  | 		ustr := u.String() | 
					
						
							| 
									
										
										
										
											2021-07-28 11:42:26 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-05-07 16:55:27 +01:00
										 |  |  | 		if _, ok := urlmap[ustr]; !ok { | 
					
						
							|  |  |  | 			// Has not been encountered yet | 
					
						
							|  |  |  | 			urls = append(urls, u) | 
					
						
							|  |  |  | 			urlmap[ustr] = struct{}{} | 
					
						
							| 
									
										
										
										
											2021-07-28 11:42:26 +02:00
										 |  |  | 		} | 
					
						
							|  |  |  | 	} | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-05-07 16:55:27 +01:00
										 |  |  | 	return urls | 
					
						
							| 
									
										
										
										
											2021-07-28 11:42:26 +02:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | // ReplaceLinks replaces all detected links in a piece of text with their HTML (href) equivalents. | 
					
						
							|  |  |  | // Note: because Go doesn't allow negative lookbehinds in regex, it's possible that an already-formatted | 
					
						
							|  |  |  | // href will end up double-formatted, if the text you pass here contains one or more hrefs already. | 
					
						
							|  |  |  | // To avoid this, you should sanitize any HTML out of text before you pass it into this function. | 
					
						
							| 
									
										
										
										
											2021-08-25 15:34:33 +02:00
										 |  |  | func (f *formatter) ReplaceLinks(ctx context.Context, in string) string { | 
					
						
							| 
									
										
										
										
											2022-05-07 16:55:27 +01:00
										 |  |  | 	return regexes.ReplaceAllStringFunc(regexes.LinkScheme, in, func(urlString string, buf *bytes.Buffer) string { | 
					
						
							| 
									
										
										
										
											2021-07-28 11:42:26 +02:00
										 |  |  | 		thisURL, err := url.Parse(urlString) | 
					
						
							|  |  |  | 		if err != nil { | 
					
						
							|  |  |  | 			return urlString // we can't parse it as a URL so don't replace it | 
					
						
							|  |  |  | 		} | 
					
						
							| 
									
										
										
										
											2022-05-07 16:55:27 +01:00
										 |  |  | 		// <a href="thisURL.String()" rel="noopener">urlString</a> | 
					
						
							|  |  |  | 		urlString = thisURL.String() | 
					
						
							|  |  |  | 		buf.WriteString(`<a href="`) | 
					
						
							|  |  |  | 		buf.WriteString(thisURL.String()) | 
					
						
							|  |  |  | 		buf.WriteString(`" rel="noopener">`) | 
					
						
							|  |  |  | 		urlString = strings.TrimPrefix(urlString, thisURL.Scheme) | 
					
						
							|  |  |  | 		urlString = strings.TrimPrefix(urlString, "://") | 
					
						
							|  |  |  | 		buf.WriteString(urlString) | 
					
						
							|  |  |  | 		buf.WriteString(`</a>`) | 
					
						
							|  |  |  | 		return buf.String() | 
					
						
							| 
									
										
										
										
											2021-07-28 11:42:26 +02:00
										 |  |  | 	}) | 
					
						
							|  |  |  | } |