HTMLタグを除去する

// Strip every HTML tag from a sample document and print the text that remains.
final String html = "<html><body><p>abc<br>def</p></body></html>";

// "<.+?>" matches '<', then one or more characters taken reluctantly, then '>'.
// The reluctant quantifier makes each match stop at the first '>' that can
// close it instead of swallowing everything up to the last '>' in the input.
// DOTALL lets '.' match line terminators too, so a tag split across lines
// is still matched.
final Pattern tagPattern = Pattern.compile("<.+?>", Pattern.DOTALL);

// Replace each matched tag with the empty string, leaving only the text.
final String stripped = tagPattern.matcher(html).replaceAll("");

System.out.println(stripped);