Golang: remove HTML tags from a string
package utils | |
import ( | |
"regexp" | |
"sort" | |
"strings" | |
) | |
// htmlTagRe matches a single opening, closing, or self-closing HTML tag,
// such as <p>, </DIV>, <br/> or <a href="x">. A tag must start with an ASCII
// letter (optionally preceded by '/'), so a bare '<' in text like "1 < 2" is
// not treated as markup. It is compiled once at package initialization rather
// than on every call.
var htmlTagRe = regexp.MustCompile(`<\/?[a-zA-Z]+?[^>]*\/?>`)

// RemoveHtmlTag returns in with every HTML tag replaced by the empty string.
//
// Only the tags themselves are removed: the text between tags is kept
// unchanged, and character entities such as &amp; are not decoded. Input that
// contains no tags is returned as-is.
func RemoveHtmlTag(in string) string {
	tags := htmlTagRe.FindAllString(in, -1)
	if len(tags) == 0 {
		return in
	}

	// Replace the longest tags first. A short tag can be a substring of a
	// longer match (e.g. "<b>" inside `<a title="<b>`), and removing the
	// short one first would leave a fragment of the longer tag behind.
	sort.Slice(tags, func(i, j int) bool {
		return len(tags[i]) > len(tags[j])
	})

	for _, tag := range tags {
		in = strings.ReplaceAll(in, tag, "")
	}
	return in
}
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment