import java.util.regex.Matcher;
import java.util.regex.Pattern;
/**
 * Small demonstration of {@link Pattern}/{@link Matcher}: searches a fixed HTML
 * fragment for the span that starts at one {@code <div id="pageContent">} tag
 * and ends at a later one, then prints what was found.
 */
public class Example {

    /**
     * Matches from a {@code <div id="pageContent">} tag up to and including a
     * later identical tag. {@code [\s\S]*} consumes any characters, including
     * line breaks, and is greedy. The expression declares no capture groups.
     */
    private static final String PAGE_CONTENT_REGEX =
            "<div id=\"pageContent\">[\\s\\S]*<div id=\"pageContent\">";

    /** Truncated HTML fragment used as the search subject. */
    private static final String SAMPLE_HTML =
            " \"HTML Tidy for Mac OS X (vers 31 October 2006 - Apple Inc. build 15.15), see www.w3.org\">\n\n" +
            " <title>02.00: Page 1</title>\n" +
            " <meta charset=\"utf-8\">\n" +
            " <script type=\"text/javascript\">\n" +
            "var pg_csslibs = []; // CSS Libs for this Page\n" +
            " var pg_jslibs = []; // JS Libs for this Page\n" +
            " </script>\n" +
            " <script src=\"../../global/js/settings.js\" id=\"settingJS\" type=\n" +
            " \"text/javascript\">\n" +
            "</script>\n" +
            "</head>\n\n" +
            "<body>\n" +
            " <div id=\"pageContent\">\n" +
            " <!-- CONTENT GOES HERE -->\n\n" +
            " <div id=\"pageContent\">\n" +
            " <div>\n" +
            " <p><a href=\"pop/02_00_01/02_00_01_pop01.htm\" class=\n" +
            " \"modal-pop\"><strong>Print</strong></a> the Carousel of Progress\n" +
            " Checklist provided below to keep track of your progress\n" +
            " through the <span class=\"lang\" data-term=\n" +
            " \"module_name\">module</span>. It is important that you read\n" +
            " each page and complete all practice activities in every\n" +
            " <span class=\"lang\" data-term=\"lesson_name";

    /**
     * Runs a single search over the sample HTML and prints the result to
     * standard output: one "Full match" line, followed by one "Group n" line
     * per capture group. Prints nothing when the pattern is not found.
     *
     * @param args command-line arguments; not used
     */
    public static void main(String[] args) {
        final Matcher hit = Pattern.compile(PAGE_CONTENT_REGEX).matcher(SAMPLE_HTML);

        // Only the first occurrence is reported; bail out early when there is none.
        if (!hit.find()) {
            return;
        }

        System.out.println("Full match: " + hit.group(0));

        // Group 0 is the whole match, so capture groups are numbered from 1.
        int groupIndex = 1;
        while (groupIndex <= hit.groupCount()) {
            System.out.println("Group " + groupIndex + ": " + hit.group(groupIndex));
            groupIndex++;
        }
    }
}
// Please keep in mind that these code samples are automatically generated and are not guaranteed to work. If you find any syntax errors, feel free to submit a bug report. For a full regex reference for Java, please visit: https://docs.oracle.com/javase/7/docs/api/java/util/regex/Pattern.html