/**
 * Matcher for balanced `<div class="aawp">…</div>` blocks.
 *
 * The pattern this replaces was written for PCRE: it used free-spacing
 * comments and subroutine recursion (`(?1)`), neither of which JavaScript's
 * RegExp supports, and it lived in a quoted string literal spanning several
 * lines, which is a syntax error. The same grammar is implemented here by
 * hand:
 *
 *   match   := element, starting exactly at `<div class="aawp">`
 *   element := '<' name [^>]* '>' node* '</' name '>'
 *   node    := text | void | comment | element
 *   text    := one or more characters other than '<' and '>'
 *   void    := '<' voidName [^>]* '>'
 *   comment := '<!--' … '-->'   (shortest possible, may span lines)
 *
 * `name` is `\w+`, and a closing tag must be spelled exactly `</name>`.
 */

/** Literal opening tag that every match must start with. */
const AAWP_OPENING_TAG = '<div class="aawp">';

/**
 * Void elements never have a closing tag, so they do not open a nesting
 * level. Names are compared exactly; the PCRE lookahead only tested a prefix,
 * so `<colgroup>` could be mistaken for the void `<col>`.
 */
const VOID_ELEMENTS = new Set([
  'area', 'base', 'br', 'col', 'embed', 'hr', 'img',
  'input', 'link', 'meta', 'param', 'source', 'track', 'wbr',
]);

/** Sticky pattern for a single opening (or void) tag; group 1 is the tag name. */
const OPENING_TAG = /<(\w+)[^>]*>/y;

/**
 * Consumes one balanced, non-void element that starts at `start`.
 *
 * An explicit stack of open tag names replaces the pattern recursion, so the
 * scan is linear and deeply nested markup cannot overflow the call stack.
 *
 * @param {string} input - Text being scanned.
 * @param {number} start - Index of the element's `<`.
 * @returns {{ end: number, tagName: string } | null} Index just past the
 *   closing tag plus the root tag name, or `null` when the element is
 *   malformed or never closed.
 */
function matchBalancedElement(input, start) {
  OPENING_TAG.lastIndex = start;
  const root = OPENING_TAG.exec(input);
  if (root === null || VOID_ELEMENTS.has(root[1])) {
    return null;
  }

  const openTags = [root[1]];
  let pos = OPENING_TAG.lastIndex;

  while (pos < input.length) {
    if (input.startsWith('</', pos)) {
      // A closing tag must close the innermost open element.
      const tagName = openTags[openTags.length - 1];
      const closingTag = `</${tagName}>`;
      if (!input.startsWith(closingTag, pos)) {
        return null;
      }
      openTags.pop();
      pos += closingTag.length;
      if (openTags.length === 0) {
        return { end: pos, tagName };
      }
    } else if (input.startsWith('<!--', pos)) {
      // Comments are skipped wholesale, so tags inside them are not counted.
      const commentEnd = input.indexOf('-->', pos + 4);
      if (commentEnd === -1) {
        return null;
      }
      pos = commentEnd + 3;
    } else if (input[pos] === '<') {
      OPENING_TAG.lastIndex = pos;
      const tag = OPENING_TAG.exec(input);
      if (tag === null) {
        return null;
      }
      pos = OPENING_TAG.lastIndex;
      if (!VOID_ELEMENTS.has(tag[1])) {
        openTags.push(tag[1]);
      }
    } else if (input[pos] === '>') {
      // A stray '>' is not valid text in this grammar.
      return null;
    } else {
      pos += 1; // plain text character
    }
  }

  return null; // input ended while elements were still open
}

/**
 * RegExp-like matcher following the global-regex protocol: `exec` starts
 * searching at `lastIndex`, moves `lastIndex` past a successful match, and
 * resets it to 0 when nothing more is found.
 *
 * A result mirrors a RegExp match array: `[match, group1, group2]` with
 * `index`, `input` and `groups`. Group 1 is the whole element (the same text
 * as the match) and group 2 is the root tag name, as in the PCRE pattern.
 */
const regex = {
  lastIndex: 0,

  /**
   * @param {string} input - Text to search (coerced to string).
   * @returns {Array | null} Match array, or `null` when no further match exists.
   */
  exec(input) {
    const text = String(input);
    let from = this.lastIndex;

    for (;;) {
      const index = text.indexOf(AAWP_OPENING_TAG, from);
      if (index === -1) {
        break;
      }
      const element = matchBalancedElement(text, index);
      if (element !== null) {
        const whole = text.slice(index, element.end);
        const match = [whole, whole, element.tagName];
        match.index = index;
        match.input = text;
        match.groups = undefined;
        this.lastIndex = element.end;
        return match;
      }
      // Unbalanced block: retry from the next candidate opening tag.
      from = index + 1;
    }

    this.lastIndex = 0;
    return null;
  },
};
// Sample HTML fixture: five top-level `<div class="aawp">` blocks holding
// nested divs, void elements (`<br>`, `<img>`, `<hr>`) and plain text.
// One array entry per line; the final empty entry yields the trailing newline.
const str = [
  '<div class="aawp">',
  '<br>',
  '<div>',
  '<div>asd</div>',
  '</div>',
  '</div>',
  '<div class="aawp">',
  '<div id="aawp-tb-445">',
  '<div class="aawp-tb aawp-tb--desktop aawp-tb--cols-5 aawp-tb--hide-labe">',
  '<a>a</a>',
  '<br />',
  '<img src="abc">',
  '<hr>',
  '</div>',
  '<div class="aawp-tb aawp-tb--desktop aawp-tb--cols-5 aawp-tb--hide-labe">',
  '...',
  '</div>',
  '<div class="aawp-tb aawp-tb--desktop aawp-tb--cols-5 aawp-tb--hide-labe">',
  '...',
  '</div>',
  '</div>',
  '</div>',
  '<div class="aawp">',
  '...',
  '</div>',
  '<div class="aawp">',
  '<div id="aawp-tb-445">',
  '<div class="aawp-tb aawp-tb--desktop aawp-tb--cols-5 aawp-tb--hide-labe">',
  '...',
  '</div>',
  '</div>',
  '</div>',
  '<div class="aawp">',
  '<div> x </div>',
  '<div> x </div>',
  '</div>',
  '',
].join('\n');
// Print every match and each of its capture groups.
// If `regex` is shared with other code, set `regex.lastIndex` to 0 before
// starting, because `exec` resumes from wherever the previous search stopped.
let m;
for (m = regex.exec(str); m !== null; m = regex.exec(str)) {
  // A zero-width match leaves `lastIndex` where the match began; step past it
  // so the next `exec` call cannot return the same position forever.
  if (regex.lastIndex === m.index) {
    regex.lastIndex += 1;
  }

  // Index 0 is the full match; the remaining entries are the capture groups.
  for (const [groupIndex, match] of m.entries()) {
    console.log(`Found match, group ${groupIndex}: ${match}`);
  }
}
// Please keep in mind that these code samples are automatically generated and
// are not guaranteed to work. If you find any syntax errors, feel free to
// submit a bug report. For a full regex reference for JavaScript, please visit:
// https://developer.mozilla.org/en/docs/Web/JavaScript/Guide/Regular_Expressions