import java.util.regex.Matcher;
import java.util.regex.Pattern;
/**
 * Small demonstration program: runs a hyperlink-matching regular expression
 * over an embedded HTML sample and prints every match with its capture groups.
 */
public class Example {

    /**
     * Pattern applied to the sample text. It has three capture groups:
     * group 1 is the text between {@code <a} and {@code href}, group 2 is the
     * opening delimiter of the value (a double quote, a single quote, an
     * optional whitespace character, or nothing), and group 3 is the value,
     * matched lazily up to a repeat of group 2 that is followed by a
     * whitespace character or {@code >}.
     */
    private static final Pattern HREF_PATTERN = Pattern.compile(
            "<a([^>]+?)href\\s*=\\s*(\"|'|\\s?)(.+?)\\2(?=\\s{1}|>)");

    /**
     * Sample input, one array element per line of text, joined with
     * {@code \n}. The empty element reproduces the blank line after the
     * fourth anchor; there is no newline after the final {@code END}.
     */
    private static final String SAMPLE_HTML = String.join("\n",
            "<a href=/pesho></a>",
            "<a href='Ilia'></a>",
            "<a class=\"bull\" href=\"http://super-href/dot.com\"></a>",
            "<a href=/softuni.bg class=\"danger'></a>",
            "",
            "<!DOCTYPE html>",
            "<html>",
            "<head>",
            " <title>Hyperlinks</title>",
            " <link href=\"theme.css\" rel=\"stylesheet\" />",
            "</head>",
            "<body>",
            "<ul><li><a href=\"/\" id=\"home\">Home</a></li><li><a",
            " class=\"selected\" href=/courses>Courses</a>",
            "</li><li><a href = ",
            "'/forum' >Forum</a></li><li><a class=\"href\"",
            "onclick=\"go()\" href= \"#\">Forum</a></li>",
            "<li><a id=\"js\" href =",
            "\"javascript:alert('hi yo')\" class=\"new\">click</a></li>",
            "<li><a id='nakov' href =",
            "http://www.nakov.com class='new'>nak</a></li></ul>",
            "<a href=\"#empty\"></a>",
            "<a id=\"href\">href='fake'<img src='http://abv.bg/i.gif' ",
            "alt='abv'/></a><a href=\"#\"><a href='hello'></a>",
            "<!-- This code is commented:",
            " <a href=\"#commented\">commentex hyperlink</a> -->",
            "</body>",
            "END");

    /**
     * Scans the sample text and prints each match to standard output.
     *
     * @param args command-line arguments; not used
     */
    public static void main(String[] args) {
        Matcher hits = HREF_PATTERN.matcher(SAMPLE_HTML);
        while (hits.find()) {
            // group() with no argument is the whole match, same as group(0).
            System.out.println("Full match: " + hits.group());
            printGroups(hits);
        }
    }

    /** Prints every numbered capture group of the current match, one per line. */
    private static void printGroups(Matcher hit) {
        int groupIndex = 1;
        while (groupIndex <= hit.groupCount()) {
            System.out.println("Group " + groupIndex + ": " + hit.group(groupIndex));
            groupIndex++;
        }
    }
}
// Please keep in mind that these code samples are automatically generated and are not guaranteed to work. If you find any syntax errors, feel free to submit a bug report. For a full regex reference for Java, please visit: https://docs.oracle.com/javase/7/docs/api/java/util/regex/Pattern.html