This commit is contained in:
Marius
2025-08-12 10:15:47 +03:00
parent 82950b81a5
commit 1afc7dc29b
2 changed files with 305 additions and 0 deletions

199
input/urls.yaml Normal file
View File

@@ -0,0 +1,199 @@
# urlwatch job list (urls.yaml): one job per YAML document, separated by `---`.
# A basic URL job just needs a `url`; every other key used below is optional.
# Job: watch the e-Factura technical information page on mfinante.gov.ro.
name: "efacturax"
url: "https://mfinante.gov.ro/web/efactura/informatii-tehnice"
timeout: 30
max_tries: 3
# Browser-like request headers; entries must be nested under `headers`,
# otherwise they parse as unknown top-level job keys.
headers:
  User-Agent: "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
  Accept: "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8"
  Accept-Language: "ro-RO,ro;q=0.9,en;q=0.8"
  Connection: "keep-alive"
# Reduce the fetched HTML to plain text, then trim surrounding whitespace.
filter:
  - html2text
  - strip
---
# Job: watch the SAF-T page in the digitalisation projects section of anaf.ro.
name: "saft"
url: "https://www.anaf.ro/anaf/internet/ANAF/despre_anaf/strategii_anaf/proiecte_digitalizare/saf_t"
timeout: 30
max_tries: 3
# Browser-like request headers; entries must be nested under `headers`,
# otherwise they parse as unknown top-level job keys.
headers:
  User-Agent: "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
  Accept: "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8"
  Accept-Language: "ro-RO,ro;q=0.9,en;q=0.8"
  Connection: "keep-alive"
# Reduce the fetched HTML to plain text, then trim surrounding whitespace.
filter:
  - html2text
  - strip
---
# Job: watch the declarations download page (descarcare_declaratii.htm) on
# static.anaf.ro.
name: "anaf descarcare declaratii"
url: "https://static.anaf.ro/static/10/Anaf/Declaratii_R/descarcare_declaratii.htm"
timeout: 30
max_tries: 3
# Browser-like request headers; entries must be nested under `headers`,
# otherwise they parse as unknown top-level job keys.
headers:
  User-Agent: "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
  Accept: "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8"
  Accept-Language: "ro-RO,ro;q=0.9,en;q=0.8"
  Connection: "keep-alive"
# Reduce the fetched HTML to plain text, then trim surrounding whitespace.
filter:
  - html2text
  - strip
---
# Job: watch the declaration 100 page (100.html) on static.anaf.ro.
name: "anaf D100"
url: "https://static.anaf.ro/static/10/Anaf/Declaratii_R/100.html"
timeout: 30
max_tries: 3
# Browser-like request headers; entries must be nested under `headers`,
# otherwise they parse as unknown top-level job keys.
headers:
  User-Agent: "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
  Accept: "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8"
  Accept-Language: "ro-RO,ro;q=0.9,en;q=0.8"
  Connection: "keep-alive"
# Reduce the fetched HTML to plain text, then trim surrounding whitespace.
filter:
  - html2text
  - strip
---
# Job: watch the declaration 101 page (101.html) on static.anaf.ro.
name: "anaf D101"
url: "https://static.anaf.ro/static/10/Anaf/Declaratii_R/101.html"
timeout: 30
max_tries: 3
# Browser-like request headers; entries must be nested under `headers`,
# otherwise they parse as unknown top-level job keys.
headers:
  User-Agent: "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
  Accept: "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8"
  Accept-Language: "ro-RO,ro;q=0.9,en;q=0.8"
  Connection: "keep-alive"
# Reduce the fetched HTML to plain text, then trim surrounding whitespace.
filter:
  - html2text
  - strip
---
# Job: watch the declaration 300 page (300.html) on static.anaf.ro.
name: "anaf D300"
url: "https://static.anaf.ro/static/10/Anaf/Declaratii_R/300.html"
timeout: 30
max_tries: 3
# Browser-like request headers; entries must be nested under `headers`,
# otherwise they parse as unknown top-level job keys.
headers:
  User-Agent: "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
  Accept: "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8"
  Accept-Language: "ro-RO,ro;q=0.9,en;q=0.8"
  Connection: "keep-alive"
# Reduce the fetched HTML to plain text, then trim surrounding whitespace.
filter:
  - html2text
  - strip
---
# Job: watch the declaration 390 page (390.html) on static.anaf.ro.
name: "anaf D390"
url: "https://static.anaf.ro/static/10/Anaf/Declaratii_R/390.html"
timeout: 30
max_tries: 3
# Browser-like request headers; entries must be nested under `headers`,
# otherwise they parse as unknown top-level job keys.
headers:
  User-Agent: "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
  Accept: "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8"
  Accept-Language: "ro-RO,ro;q=0.9,en;q=0.8"
  Connection: "keep-alive"
# Reduce the fetched HTML to plain text, then trim surrounding whitespace.
filter:
  - html2text
  - strip
---
# Job: watch the declaration 394 page (394.html) on static.anaf.ro.
name: "anaf D394"
url: "https://static.anaf.ro/static/10/Anaf/Declaratii_R/394.html"
timeout: 30
max_tries: 3
# Browser-like request headers; entries must be nested under `headers`,
# otherwise they parse as unknown top-level job keys.
headers:
  User-Agent: "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
  Accept: "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8"
  Accept-Language: "ro-RO,ro;q=0.9,en;q=0.8"
  Connection: "keep-alive"
# Reduce the fetched HTML to plain text, then trim surrounding whitespace.
filter:
  - html2text
  - strip
---
# Job: watch the declaration 205 page (205.html) on static.anaf.ro.
name: "anaf D205"
url: "https://static.anaf.ro/static/10/Anaf/Declaratii_R/205.html"
timeout: 30
max_tries: 3
# Browser-like request headers; entries must be nested under `headers`,
# otherwise they parse as unknown top-level job keys.
headers:
  User-Agent: "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
  Accept: "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8"
  Accept-Language: "ro-RO,ro;q=0.9,en;q=0.8"
  Connection: "keep-alive"
# Reduce the fetched HTML to plain text, then trim surrounding whitespace.
filter:
  - html2text
  - strip
---
# Job: watch the "romfast/clienti" verification endpoint served from
# 10.0.20.122:81.
# NOTE(review): this is a private 10.x address over plain HTTP, presumably
# reachable only from the internal network; confirm the urlwatch host can
# reach it.
name: "romfast facturi clienti"
url: "http://10.0.20.122:81/contafinupdate/situatieparteneri/verificare/romfast/clienti"
timeout: 30
max_tries: 3
# Browser-like request headers; entries must be nested under `headers`,
# otherwise they parse as unknown top-level job keys.
headers:
  User-Agent: "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
  Accept: "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8"
  Accept-Language: "ro-RO,ro;q=0.9,en;q=0.8"
  Connection: "keep-alive"
# Reduce the fetched HTML to plain text, then trim surrounding whitespace.
filter:
  - html2text
  - strip
---
# Job: watch the 2025 semi-annual financial statements page
# (situatiifinanciare/2025/semestriale) on static.anaf.ro.
name: "bilant 06/2025"
url: "https://static.anaf.ro/static/10/Anaf/Declaratii_R/situatiifinanciare/2025/semestriale/1027_1050_2025.html"
timeout: 30
max_tries: 3
# Browser-like request headers; entries must be nested under `headers`,
# otherwise they parse as unknown top-level job keys.
headers:
  User-Agent: "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
  Accept: "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8"
  Accept-Language: "ro-RO,ro;q=0.9,en;q=0.8"
  Connection: "keep-alive"
# Reduce the fetched HTML to plain text, then trim surrounding whitespace.
filter:
  - html2text
  - strip
---
# Job: watch the 2025 financial statements page
# (situatiifinanciare/2025/1002_5_2025.html) on static.anaf.ro.
name: "bilant 12/2025"
url: "https://static.anaf.ro/static/10/Anaf/Declaratii_R/situatiifinanciare/2025/1002_5_2025.html"
timeout: 30
max_tries: 3
# Browser-like request headers; entries must be nested under `headers`,
# otherwise they parse as unknown top-level job keys.
headers:
  User-Agent: "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
  Accept: "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8"
  Accept-Language: "ro-RO,ro;q=0.9,en;q=0.8"
  Connection: "keep-alive"
# Reduce the fetched HTML to plain text, then trim surrounding whitespace.
filter:
  - html2text
  - strip
---
# Job: watch the 2026 semi-annual financial statements page
# (situatiifinanciare/2026/semestriale) on static.anaf.ro.
# NOTE(review): the URL follows the 2025 naming pattern; the 2026 page may
# not be published yet, in which case this job will report fetch errors
# until it appears. Confirm that is intended.
name: "bilant 06/2026"
url: "https://static.anaf.ro/static/10/Anaf/Declaratii_R/situatiifinanciare/2026/semestriale/1027_1050_2026.html"
timeout: 30
max_tries: 3
# Browser-like request headers; entries must be nested under `headers`,
# otherwise they parse as unknown top-level job keys.
headers:
  User-Agent: "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
  Accept: "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8"
  Accept-Language: "ro-RO,ro;q=0.9,en;q=0.8"
  Connection: "keep-alive"
# Reduce the fetched HTML to plain text, then trim surrounding whitespace.
filter:
  - html2text
  - strip
---
# Job: watch the 2026 financial statements page
# (situatiifinanciare/2026/1002_5_2026.html) on static.anaf.ro.
# NOTE(review): the URL follows the 2025 naming pattern; the 2026 page may
# not be published yet, in which case this job will report fetch errors
# until it appears. Confirm that is intended.
name: "bilant 12/2026"
url: "https://static.anaf.ro/static/10/Anaf/Declaratii_R/situatiifinanciare/2026/1002_5_2026.html"
timeout: 30
max_tries: 3
# Browser-like request headers; entries must be nested under `headers`,
# otherwise they parse as unknown top-level job keys.
headers:
  User-Agent: "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36"
  Accept: "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8"
  Accept-Language: "ro-RO,ro;q=0.9,en;q=0.8"
  Connection: "keep-alive"
# Reduce the fetched HTML to plain text, then trim surrounding whitespace.
filter:
  - html2text
  - strip
---