| /******************************************************************************* |
| * Copyright (c) 2015 David Green. |
| * All rights reserved. This program and the accompanying materials |
| * are made available under the terms of the Eclipse Public License v1.0 |
| * which accompanies this distribution, and is available at |
| * http://www.eclipse.org/legal/epl-v10.html |
| * |
| * Contributors: |
| * David Green - initial API and implementation |
| *******************************************************************************/ |
| |
| package org.eclipse.mylyn.internal.wikitext.commonmark.inlines; |
| |
| import java.util.Set; |
| import java.util.regex.Matcher; |
| import java.util.regex.Pattern; |
| |
| import com.google.common.base.Optional; |
| import com.google.common.collect.ImmutableList; |
| import com.google.common.collect.ImmutableSet; |
| import com.google.common.net.UrlEscapers; |
| |
| public class AutoLinkSpan extends SourceSpan { |
| |
| private static final Set<String> SCHEMES = ImmutableSet.of("coap", "doi", "javascript", "aaa", "aaas", "about", |
| "acap", "cap", "cid", "crid", "data", "dav", "dict", "dns", "file", "ftp", "geo", "go", "gopher", "h323", |
| "http", "https", "iax", "icap", "im", "imap", "info", "ipp", "iris", "iris.beep", "iris.xpc", "iris.xpcs", |
| "iris.lwz", "ldap", "mailto", "mid", "msrp", "msrps", "mtqp", "mupdate", "news", "nfs", "ni", "nih", "nntp", |
| "opaquelocktoken", "pop", "pres", "rtsp", "service", "session", "shttp", "sieve", "sip", "sips", "sms", |
| "snmp", "soap.beep", "soap.beeps", "tag", "tel", "telnet", "tftp", "thismessage", "tn3270", "tip", "tv", |
| "urn", "vemmi", "ws", "wss", "xcon", "xcon-userid", "xmlrpc.beep", "xmlrpc.beeps", "xmpp", "z39.50r", |
| "z39.50s", "adiumxtra", "afp", "afs", "aim", "apt", "attachment", "aw", "beshare", "bitcoin", "bolo", |
| "callto", "chrome", "chrome-extension", "com-eventbrite-attendee", "content", "cvs", "dlna-playsingle", |
| "dlna-playcontainer", "dtn", "dvb", "ed2k", "facetime", "feed", "finger", "fish", "gg", "git", |
| "gizmoproject", "gtalk", "hcp", "icon", "ipn", "irc", "irc6", "ircs", "itms", "jar", "jms", "keyparc", |
| "lastfm", "ldaps", "magnet", "maps", "market,message", "mms", "ms-help", "msnim", "mumble", "mvn", "notes", |
| "oid", "palm", "paparazzi", "platform", "proxy", "psyc", "query", "res", "resource", "rmi", "rsync", "rtmp", |
| "secondlife", "sftp", "sgn", "skype", "smb", "soldat", "spotify", "ssh", "steam", "svn", "teamspeak", |
| "things", "udp", "unreal", "ut2004", "ventrilo", "view-source", "webcal", "wtai", "wyciwyg", "xfire", "xri", |
| "ymsgr"); |
| |
| private static final String EMAIL_DOMAIN_PART = "[a-z0-9](?:[a-z0-9-]{0,61}[a-z0-9])?"; |
| |
| private static final String EMAIL_REGEX = "[a-z0-9.!#$%&'*+/=?^_`{|}~-]+@" + EMAIL_DOMAIN_PART + "(?:\\." |
| + EMAIL_DOMAIN_PART + ")*"; |
| |
| private final Pattern linkPattern = createLinkPattern(); |
| |
| @Override |
| public Optional<? extends Inline> createInline(Cursor cursor) { |
| char c = cursor.getChar(); |
| if (c == '<') { |
| Matcher matcher = cursor.matcher(linkPattern); |
| if (matcher.matches()) { |
| String href = matcher.group(1); |
| String link = href; |
| String email = matcher.group(2); |
| if (email != null) { |
| link = "mailto:" + email; |
| } |
| int endOffset = cursor.getOffset(matcher.end(3)); |
| int linkLength = endOffset - cursor.getOffset(); |
| return Optional.of(new Link(cursor.getLineAtOffset(), cursor.getOffset(), linkLength, escapeUri(link), |
| null, ImmutableList.<Inline> of(new Characters(cursor.getLineAtOffset(), cursor.getOffset() + 1, |
| linkLength - 2, href)))); |
| } |
| } |
| return Optional.absent(); |
| } |
| |
| private String escapeUri(String link) { |
| return UrlEscapers.urlFragmentEscaper().escape(link).replace("%23", "#").replace("%25", "%"); |
| } |
| |
| private Pattern createLinkPattern() { |
| String regex = ""; |
| for (String scheme : SCHEMES) { |
| if (regex.isEmpty()) { |
| regex += "<((?:(?:"; |
| } else { |
| regex += "|"; |
| } |
| regex += scheme.replace(".", "\\."); |
| } |
| regex += "):[^\\s>]+)|(" + EMAIL_REGEX + "))(>).*"; |
| return Pattern.compile(regex, Pattern.DOTALL | Pattern.CASE_INSENSITIVE); |
| } |
| } |