From 89b15eef57178406326a36ec2b25e853eba25132 Mon Sep 17 00:00:00 2001
From: Ricardo Felgueiras
Date: Fri, 24 May 2024 10:52:58 +0100
Subject: [PATCH 1/5] feat(scrapper): add joinef posts scrapper

---
 src/scrappers/joinef-posts.yml | 15 +++++++++++++++
 1 file changed, 15 insertions(+)
 create mode 100644 src/scrappers/joinef-posts.yml

diff --git a/src/scrappers/joinef-posts.yml b/src/scrappers/joinef-posts.yml
new file mode 100644
index 0000000..3bcd39b
--- /dev/null
+++ b/src/scrappers/joinef-posts.yml
@@ -0,0 +1,15 @@
+url: 'https://www.joinef.com/posts/'
+header: Posts
+listElementsQuery: article
+elementParser:
+  - title: Title
+    query: .tile__link
+    type: text
+
+  - title: Categories
+    query: .tile__categories
+    type: text
+
+  - title: Link
+    query: .tile__link
+    type: link

From 76f02dd61810970fd16caa0b5860b658d993be05 Mon Sep 17 00:00:00 2001
From: Ricardo Felgueiras
Date: Fri, 24 May 2024 10:58:02 +0100
Subject: [PATCH 2/5] feat(scrapper): add joinef portfolio scrapper

---
 src/scrappers/joinef-portfolio.yml | 19 +++++++++++++++++++
 1 file changed, 19 insertions(+)
 create mode 100644 src/scrappers/joinef-portfolio.yml

diff --git a/src/scrappers/joinef-portfolio.yml b/src/scrappers/joinef-portfolio.yml
new file mode 100644
index 0000000..7918c53
--- /dev/null
+++ b/src/scrappers/joinef-portfolio.yml
@@ -0,0 +1,19 @@
+url: 'https://www.joinef.com/portfolio/*'
+header: Portfolio
+listElementsQuery: .tile--company--row
+elementParser:
+  - title: Name
+    query: .tile__name
+    type: text
+
+  - title: Description
+    query: .tile__description
+    type: text
+
+  - title: Tags
+    query: .tile__tags
+    type: text
+
+  - title: Link
+    query: .tile__link
+    type: link

From 5915b532499890dbdc9e73a9aa5835e06753ba11 Mon Sep 17 00:00:00 2001
From: Ricardo Felgueiras
Date: Fri, 24 May 2024 11:37:28 +0100
Subject: [PATCH 3/5] feat(scrapper): add notion templates

---
 src/scrappers/notion.yml | 15 +++++++++++++++
 1 file changed, 15 insertions(+)
 create mode 100644 src/scrappers/notion.yml

diff --git a/src/scrappers/notion.yml b/src/scrappers/notion.yml
new file mode 100644
index 0000000..8779aa9
--- /dev/null
+++ b/src/scrappers/notion.yml
@@ -0,0 +1,15 @@
+url: https://www.notion.so*
+header: Templates
+listElementsQuery: .template-grid > section
+elementParser:
+  - title: Title
+    query: '[class*="UserBaseInfo_textInfoContainer"]'
+    type: text
+
+  - title: Userbase rights
+    query: '[class*="templatePreview_userBaseRight"]'
+    type: text
+
+  - title: Link
+    query: '[class*="DynamicModal_trigger"]'
+    type: link

From b5b17430a5749c767e78aa87a6137574a01e2355 Mon Sep 17 00:00:00 2001
From: Ricardo Felgueiras
Date: Fri, 24 May 2024 12:18:56 +0100
Subject: [PATCH 4/5] feat(scraper): add milanuncios scraper

---
Changes in v2:
- Fix the misspelled `titlte` key on the Address entry; it now uses `title`
  like every other elementParser entry in this series.
- End milanuncios.yml with a newline, matching the files added by
  patches 1-3.
- The blob id on the `index` line below is carried over from v1.

 src/scrappers/milanuncios.yml | 22 ++++++++++++++++++++++
 1 file changed, 22 insertions(+)
 create mode 100644 src/scrappers/milanuncios.yml

diff --git a/src/scrappers/milanuncios.yml b/src/scrappers/milanuncios.yml
new file mode 100644
index 0000000..31fc0f6
--- /dev/null
+++ b/src/scrappers/milanuncios.yml
@@ -0,0 +1,22 @@
+url: https://www.milanuncios.com/*
+listElementsQuery: article
+elementParser:
+  - title: Title
+    query: .ma-AdCardListingV2-TitleLink
+    type: text
+
+  - title: Price
+    query: .ma-AdPrice-value
+    type: text
+
+  - title: Address
+    query: .ma-AdLocation-text
+    type: text
+
+  - title: Details
+    query: .ma-AdCardV2-description
+    type: text
+
+  - title: Link
+    query: .ma-AdCardListingV2-TitleLink
+    type: link

From 0a290276e592cb71e9fe2f62bbfb7dd6dcdd6864 Mon Sep 17 00:00:00 2001
From: Ricardo Felgueiras
Date: Fri, 24 May 2024 12:35:56 +0100
Subject: [PATCH 5/5] feat(scraper): add vrbo.com scraper

---
Changes in v2:
- End vrbo.yml with a newline, matching the files added by patches 1-3.
- The blob id on the `index` line below is carried over from v1.

 src/scrappers/vrbo.yml | 18 ++++++++++++++++++
 1 file changed, 18 insertions(+)
 create mode 100644 src/scrappers/vrbo.yml

diff --git a/src/scrappers/vrbo.yml b/src/scrappers/vrbo.yml
new file mode 100644
index 0000000..3ef22cf
--- /dev/null
+++ b/src/scrappers/vrbo.yml
@@ -0,0 +1,18 @@
+url: https://www.vrbo.com*
+listElementsQuery: '[data-stid="lodging-card-responsive"]'
+elementParser:
+  - title: Title
+    query: h3.uitk-heading
+    type: text
+
+  - title: Description
+    query: .uitk-text
+    type: text
+
+  - title: Price information
+    query: '[data-test-id="price-summary"]'
+    type: text
+
+  - title: Link
+    query: '[data-stid="open-hotel-information"]'
+    type: link