adiciona suporte a requisição via selenium gurizada

This commit is contained in:
Renan Bernordi 2024-12-07 00:05:51 -03:00
parent a6fc451f0a
commit 2b842a7cd6
10 changed files with 121 additions and 28 deletions

View file

@ -22,6 +22,7 @@
* 'scriptTagRemove' => ['gtm.js', 'ga.js'], // Exclui scripts específicos das regras globais
* 'classElementRemove' => ['subscription'] // Exclui classes específicas das regras globais
* ]
* - useSelenium: Boolean indicando se deve usar Selenium para extração
*/
return [
'nsctotal.com.br' => [
@ -38,6 +39,14 @@ return [
],
'classAttrRemove' => ['wall', 'protected-content', 'cropped-block']
],
// Per-domain rules for gauchazh.clicrbs.com.br.
'gauchazh.clicrbs.com.br' => [
// Class names handled by the 'classAttrRemove' rule (presumably stripped from elements' class attributes; confirm against the rule consumer).
// NOTE(review): ' m-paid-content' begins with a space; confirm this is intentional and not a typo.
'classAttrRemove' => [' m-paid-content', 'paid-content-apply'],
// NOTE(review): 'verdors-' looks like a misspelling of 'vendors-'; confirm it matches a real script name before removing it.
'scriptTagRemove' => ['vendors-', 'verdors-'],
// Excludes the listed entries from the global rules for this domain: the 'paid-content' class under 'classElementRemove'.
'excludeGlobalRules' => [
'classElementRemove' => ['paid-content']
],
// Use Selenium for extraction on this domain.
'useSelenium' => true
],
'foreignaffairs.com' => [
'customCode' => 'document.addEventListener(\'DOMContentLoaded\', function() {
const dropcapDiv = document.querySelector(\'.article-dropcap\');