Skip to content

Latest commit

 

History

History
268 lines (127 loc) · 25.3 KB

EXAMPLES.md

File metadata and controls

268 lines (127 loc) · 25.3 KB

Here are a few assorted examples of how newslinkrss can be used to generate feeds from several types of sites. They were working (or mostly working!) when this file was written, but sites can change at any time and break the feeds.

Sources in English

News

newslinkrss -t 5 -p 'https://apnews.com/article/.+' --follow --with-body --body-csss 'main' -C '.Page-actions, div.Page-below, template, div.Carousel-slides' -C '.Advertisement, div.Enhancement' -X '//a[not(@href) and not(node())]' --author-from-csss 'div.Page-authors span' -Q '^utm_' --title-regex '([^|]+)\s*|' https://apnews.com/
newslinkrss  --follow  -p 'https://www.reuters.com/.+/.+\d{4}-\d{2}-\d{2}.+'  --max-page-length 512  --with-body  --body-xpath '//article'  --body-remove-csss 'div[class*="article-header__toolbar__"], div[class*="article-body__toolbar__"]'  --body-remove-csss 'div[class*="article__read-next__"], div.read-next-panel'  --body-remove-csss 'div[class^="info-content__toolbar__"], div[data-testid="toolbar-container"], *[class^="social-links__container__"]' --require-dates  --title-regex '(.+)\s+\|'  https://www.reuters.com/
newslinkrss -t 5 -n 60 -p '^https://www.washingtonpost.com/.+/\d+/\d+/\d+/.+' --follow --author-from-xpath '//a[@rel="author"]/text()' --with-body --body-csss 'main header h1, main header h2, main header .print-byline, main .article-body' --title-regex '(.*\S)\s*-[^-]*'  -C '.hide-for-print' https://www.washingtonpost.com/
newslinkrss --follow -t 4 -p 'https://www.economist.com/.+/\d{4}/\d{2}/\d{2}/.+' --max-page-length 512 --with-body --body-csss 'article section' --title-regex '(.+)\s*|' --date-from-xpath '//time[@datetime]/@datetime' -C style --require-dates https://www.economist.com/
newslinkrss -p 'https://www.kyivpost.com/post/\d+' -fB --body-csss '.post-lead, div#post-content' --title-from-csss 'h1.post-title' --date-from-csss 'div.post-info' --csss-date-regex '.*([A-Z][a-z]+.*\s\d+,\s+\d+.+[ap]m)'  --author-from-csss 'div.post-info a[href*="/authors/"], a.post-author-name' https://www.kyivpost.com/
newslinkrss  -p 'https://abcnews.go.com/.+/.+(-|id=)\d+' --follow --date-from-xpath '//meta[@property="lastPublishedDate"]/@content' --with-body --body-csss 'div.FITT_Article_main__body' --require-dates --title-regex '(.+)\s*-\s*ABC News' https://abcnews.go.com/
newslinkrss --follow -p '.*//nymag.com/intelligencer/(article|\d+/\d+)/.+\.html' --with-body --body-csss 'article' -C 'aside.newsletter-flex-text' -C 'section.package-list' -C 'div.comments-link' -C 'div.tags' -C 'style' https://nymag.com/intelligencer/
newslinkrss -p 'https://www.nbcnews.com/.+/.+/.+\d+' -i 'https://www.nbcnews.com/select/.+' -i 'https://www.nbcnews.com/[a-z-]+/video/.+' -i 'https://www.nbcnews.com/news/.+/nbc-affiliates.*\d+' --follow --with-body --body-csss 'article' --title-from-csss h1 --date-from-xpath '//time[@datetime]/@datetime' --author-from-csss '.byline-name a[href*="/author/"]' --categories-from-csss 'header .unibrow a span' -C '.ad-container, .article-social-share-top, .byline-thumbnail picture' https://www.nbcnews.com/
newslinkrss -fB -t 4 -p 'https://aviationweek.com/.+/.+/.+' --body-csss 'div.article__header, div.article__body'  --title-from-csss 'h1.page-title' --author-from-csss 'a.article__byline' --date-from-csss 'span.article__date' --categories-from-csss 'ul.tags li a' -i 'https://aviationweek.com/(taxonomy|podcasts|user|knowledge-center)/.+'  -C 'div.share' https://aviationweek.com/
newslinkrss -fB -p 'https://www.wired.com/story/.+' --body-csss 'div.body__inner-container' --author-from-xpath '//meta[@property="article:author"]/@content'  --categories-from-xpath '//meta[@name="keywords"]/@content' --split-categories ','  --title-regex '([^|]+)\s*' -T 'Wired Wired - stories only; no reviews, payola, etc.' https://www.wired.com/
newslinkrss -p 'https://www.semafor.com/.+/\d+/\d+/\d+/.+' -fB --body-csss main -C 'form, div[class*="styles_shareWrapper__"], div[class*="styles_mobileShare__"], div[class*="styles_navMenuWrapper__"], div[class*="styles_indexMenu__"]' --author-from-csss 'a[href*="/author/"]' --title-regex '^([^|]+)\s*|' --encoding utf-8 https://www.semafor.com/

J. R. R. Tolkien

newslinkrss --follow --with-body -p '^https://www.deviantart.com/.+/art/.+\d+' --body-xpath '//div[@data-hook="arrowL"]/../..//img | //div[@id="description"]' --title-from-csss h1 --date-from-xpath '(//main//time[@datetime]/@datetime)[1]' --author-from-xpath '//h1/../..//a[@data-username]/@data-username' --categories-from-csss 'a[href*="/tag/"].reset-link span' https://www.deviantart.com/tag/tolkien?order=most-recent  https://www.deviantart.com/search?q=tolkien
newslinkrss --follow --with-body -p '^https://www.deviantart.com/.+/art/.+\d+' --body-xpath '//div[@data-hook="arrowL"]/../..//img | //div[@id="description"]' --title-from-csss h1 --date-from-xpath '(//main//time[@datetime]/@datetime)[1]' --author-from-xpath '//h1/../..//a[@data-username]/@data-username' --categories-from-csss 'a[href*="/tag/"].reset-link span' https://www.deviantart.com/tag/lotrcosplay?order=most-recent https://www.deviantart.com/tag/silmarillioncosplay?order=most-recent  https://www.deviantart.com/search?q=tolkien+cosplay+or+silmarillion+cosplay+or+lotr+cosplay
newslinkrss --follow --with-body -p '^https://www.deviantart.com/.+/art/.+\d+' --body-xpath '//div[@data-hook="arrowL"]/../..//img | //div[@id="description"]' --title-from-csss h1 --date-from-xpath '(//time[@datetime]/@datetime)[1]' --author-from-xpath '//h1/../..//a[@data-username]/@data-username' --categories-from-csss 'a[href*="/tag/"].reset-link span' https://www.deviantart.com/silmarillion-club/gallery/

Science

newslinkrss -p 'https://www.nature.com/articles/.+' --follow  --with-body --body-csss 'main' --date-from-xpath '//time[@datetime]/@datetime' --title-regex '(.+)\s*\|\s*Nature' -C '.u-hide-print' -C '.hide-print' -C 'style' https://www.nature.com/
newslinkrss  --follow  -p 'https://www.reuters.com/.+/.+\d{4}-\d{2}-\d{2}.+'  --max-page-length 512  --with-body  --body-xpath '//article'  --body-remove-csss 'div[class*="article-header__toolbar__"], div[class*="article-body__toolbar__"]'  --body-remove-csss 'div[class*="article__read-next__"], div.read-next-panel'  --body-remove-csss 'div[class^="info-content__toolbar__"], div[data-testid="toolbar-container"], *[class^="social-links__container__"]' --require-dates  --title-regex '(.+)\s+\|'  https://www.reuters.com/science/

Computing

newslinkrss -p 'https://www.usenix.org/publications/loginonline/[^/]+' -i '.*/loginonline/writing$' -t 5 --follow --with-body --body-csss '#main-wrapper' --title-regex '^([^|]*[^|\s])' https://www.usenix.org/publications/loginonline
newslinkrss -p 'https://www.usenix.org/conference/[^/]+/presentation/.+' -t 5 --follow --with-body --body-csss 'article' --title-regex '^([^|]*[^|\s])' https://www.usenix.org/publications/proceedings

Sources in Portuguese / Fontes em Português

Jornais, revistas e TVs

newslinkrss --follow -p 'https://www.*\.folha\.uol\.com.br/.+/\d+/\d+/.+\.shtml' --with-body --body-csss 'header.c-content-head h1, header.c-content-head h2, div.c-signature, div.c-news__body' -C 'div.rs_skip'  --title-regex '(.+) - \d+/\d+/\d+ -\s+.+\s+- Folha' --author-from-csss '.c-signature__author a, .c-signature__author, cite.c-blog-top__author-name, .c-author__name a, .c-top-columnist__name a' --encoding 'utf-8' --max-page-length 512 --body-rename-attr img data-src src https://www1.folha.uol.com.br/ultimas-noticias/ https://www.folha.uol.com.br/
newslinkrss -f -B -p 'https://www.diariodajaragua.com.br/.+/[0-9]+/' --body-xpath '//article' --max-page-length 1024 https://www.diariodajaragua.com.br/jaragua-do-sul/ -X '//a[contains(@href, "https://chat.whatsapp.com")]/..' -C '.squareBanner' -X '//header' -X '//section'
newslinkrss -p 'https://oglobo.globo.com/.+noticia/\d+/\d+/\d+/.+.ghtml' -fB --body-csss 'section.content--header div.content-head, section.content--header div.content__signature, article' --date-from-xpath '//time[@itemprop="datePublished" and @datetime]/@datetime'  --author-from-xpath '//meta[@itemprop="name"]/@content | //address[@itemprop="author"]/*[@itemprop="name"]' -C 'section.mc-column.box-wrapper, section.passador-materia'  https://oglobo.globo.com/ultimas-noticias/ https://oglobo.globo.com/ultimas-noticias/index/feed/pagina-4 https://oglobo.globo.com/ultimas-noticias/index/feed/pagina-5 https://oglobo.globo.com/ultimas-noticias/index/feed/pagina-6
newslinkrss -p 'https://www\.correiobraziliense\.com\.br/.+/\d+/\d+/\d+-.+\.html' -i 'https://www\.correiobraziliense\.com\.br/webstories/.+' -i '.+/brandedcontent/.+' --follow --with-body --body-csss '.materia-title h1, .materia-title h2, article'  -C 'div.entry-headerBox, .noticia_notificacao, div.read-more, section.read-more, #socialBar, .socialBarWrapper' -C 'style, div#tags' --categories-from-csss '#tags ul li a' --encoding utf-8  https://www.correiobraziliense.com.br/
newslinkrss -p 'https://cultura.uol.com.br/.+/\d+/\d+/\d+/\d+.+\.html' -p 'https://cultura.uol.com.br/noticias/(.+/)?\d+_.+.html' -fB --body-csss '#programas-box-info aside h2, #programas-box-info aside p, article' --date-from-csss '#programas-box-info aside small' --csss-date-regex '\s*(\d+/\d+/\d+\s+\d+h\d+)\s*' --csss-date-fmt '%d/%m/%Y %Hh%M' --author-from-csss 'span.author' https://cultura.uol.com.br/entretenimento/ https://cultura.uol.com.br/noticias/

Colunistas

newslinkrss -p 'https://oglobo.globo.com/opiniao/elio-gaspari/.+/\d+/\d+/.+\.ghtml' -fB --body-csss 'section.content--header div.content-head, section.content--header div.content__signature, article' --date-from-xpath '//time[@itemprop="datePublished" and @datetime]/@datetime' --author-from-csss 'address.header-coluna__title' -C 'section.mc-column.box-wrapper, section.passador-materia' https://oglobo.globo.com/opiniao/elio-gaspari/
newslinkrss -p 'https://oglobo.globo.com/blogs/miriam-leitao/.+/\d+/\d+/.+\.ghtml' -fB --body-csss 'section.content--header div.content-head, section.content--header div.content__signature, article' --date-from-xpath '//time[@itemprop="datePublished" and @datetime]/@datetime' --author-from-csss 'address.header-coluna__title' -C 'section.mc-column.box-wrapper, section.passador-materia' https://oglobo.globo.com/blogs/miriam-leitao/ https://oglobo.globo.com/blogs/miriam-leitao/index/feed/pagina-4
newslinkrss --follow -p 'https://www1.folha.uol.com.br/colunas/helioschwartsman/\d+/\d+/.+\.shtml' --with-body --body-csss 'header.c-content-head h1, header.c-content-head h2, div.c-signature, div.c-news__body' -C 'div.rs_skip'  --title-regex '(.+) - \d+/\d+/\d+ -\s+.+\s+- Folha' --author-from-csss '.c-signature__author a, cite.c-blog-top__author-name, .c-author__name a, .c-top-columnist__name a' --encoding 'utf-8' --require-dates https://www1.folha.uol.com.br/colunas/helioschwartsman/
newslinkrss --follow -p 'https://www1.folha.uol.com.br/.+/\d+/\d+/.+\.shtml' --with-body --body-csss 'header.c-content-head h1, header.c-content-head h2, div.c-signature, div.c-news__body' -C 'div.rs_skip'  --title-regex '(.+) - \d+/\d+/\d+ -\s+.+\s+- Folha' --author-from-csss '.c-signature__author a, cite.c-blog-top__author-name, .c-author__name a, .c-top-columnist__name a' --encoding 'utf-8' --max-page-length 512 --require-dates https://www1.folha.uol.com.br/autores/reinaldo-jose-lopes.shtml
newslinkrss --follow -p 'https://www1.folha.uol.com.br/.+/lygia-maria/\d+/\d+/.+\.shtml' --with-body --body-csss 'header.c-content-head h1, header.c-content-head h2, div.c-signature, div.c-news__body' -C 'div.rs_skip'  --title-regex '(.+) - \d+/\d+/\d+ -\s+.+\s+- Folha' --author-from-csss '.c-signature__author a, cite.c-blog-top__author-name, .c-author__name a, .c-top-columnist__name a' --encoding 'utf-8' --max-page-length 512 --require-dates https://www1.folha.uol.com.br/colunas/lygia-maria/

Portais

newslinkrss --follow -t 4  -p 'https://noticias.uol.com.br/.+/\d+/\d+/.+' --date-from-xpath '//p[@ia-date-publish]/@ia-date-publish | //article//time[@datetime]/@datetime' --with-body --body-csss 'article div.author, article div.text, main article' --author-from-csss a.solar-author-name --title-regex '(.+)\s+- UOL Notícias' -X '//div[@ia-related-content]' -C 'div.ads-wrapper, .solar-ads, .jupiter-ads, .solar-comment, .jupiter-see-too, .solar-social-media, .jupiter-share' -C 'aside, div.related-content, .related-content-front, div.related-content-piano, .chartbeat-related-content, .related-content-hyperlink, .blogs-and-columns-recommendation' -C 'div.loading-box, div.clearfix, .new-post-notice, .new-post-notice-columnist' -C 'svg' -C 'style' -C 'img.img-author' -C 'div.magazine-cover' -C '.disclaimer-exclusive-content'  --body-rename-attr img data-src src https://noticias.uol.com.br/
newslinkrss --follow -p 'https://g1.globo.com/.+santa-catarina/.*\d+/\d+/\d+/.+\.ghtml' -i '.+/especial-publicitario/.+' --with-body --body-xpath '//article' -N amp-img img --date-from-xpath '//time[@datetime]/@datetime' --title-regex '([^|]+)' $(seq -f "https://g1.globo.com/sc/santa-catarina/index/feed/pagina-%.0f.ghtml"  1 5)
newslinkrss --follow -p 'https://g1.globo.com/.+parana/.*\d+/\d+/\d+/.+\.ghtml' -i '.+/especial-publicitario/.+' --with-body --body-xpath '//article' -N amp-img img --date-from-xpath '//time[@datetime]/@datetime' --title-regex '([^|]+)'  'https://g1.globo.com/pr/parana/'  $(seq -f "https://g1.globo.com/pr/parana/index/feed/pagina-%.0f.ghtml"  1 5)
newslinkrss -t 4 -p 'https://www.nsctotal.com.br/(noticias|colunistas/.+)/.+' -i '.+://www.nsctotal.com.br/noticias/noticias-whatsapp-nsc-total' --follow --with-body --body-csss '#post-content' --title-from-csss h1.title --author-from-csss '.author a'  --categories-from-csss 'div.tags a.tag' -C '.ad-single, .nsc-content-ads, .related-news, .col-md-auto h3' -C '#h-leia-tambem ~ p, #h-leia-tambem' -C '#h-leia-mais ~ p, #h-leia-mais' -C 'a[href*=whatsapp]'  https://www.nsctotal.com.br/tag/jaragua-do-sul https://www.nsctotal.com.br/tag/jaragua-do-sul?page=2 https://www.nsctotal.com.br/tag/jaragua-do-sul?page=3
newslinkrss -t 10 -p 'https://www.nsctotal.com.br/(noticias|colunistas/.+)/.+' -i '.+://www.nsctotal.com.br/noticias/noticias-whatsapp-nsc-total' --follow --with-body --body-csss '#post-content' --title-from-csss h1.title --author-from-csss '.author a'  --categories-from-csss 'div.tags a.tag' -C '.ad-single, .nsc-content-ads, .related-news, .col-md-auto h3' -C '#h-leia-tambem ~ p, #h-leia-tambem' -C '#h-leia-mais ~ p, #h-leia-mais' -C 'a[href*=whatsapp]'  https://www.nsctotal.com.br/cidades/joinville https://www.nsctotal.com.br/ultimas/cidades/joinville https://www.nsctotal.com.br/ultimas/cidades/joinville?page=2
newslinkrss -t 4 -p 'https://www.nsctotal.com.br/(noticias|colunistas/.+)/.+' -i '.+://www.nsctotal.com.br/noticias/noticias-whatsapp-nsc-total' --follow --with-body --body-csss '#post-content' --title-from-csss h1.title --author-from-csss '.author a'  --categories-from-csss 'div.tags a.tag' -C '.ad-single, .nsc-content-ads, .related-news, .col-md-auto h3' -C '#h-leia-tambem ~ p, #h-leia-tambem' -C '#h-leia-mais ~ p, #h-leia-mais' -C 'a[href*=whatsapp]'  https://www.nsctotal.com.br/ https://www.nsctotal.com.br/ultimas-noticias https://www.nsctotal.com.br/ultimas-noticias?paged=2
newslinkrss -f -B -p 'https://crusoe.com.br/(edicoes/\d+|secao|diario)/.+'  --body-csss 'article.post' -C 'style, svg' -C 'div.share, .container_share, div.tags' -C '#action-mark, #show-audio-player' -C '#wallcontent, #move-banner-box1' -C '.comment-section'  --date-from-csss 'span.data' --csss-date-regex '(\d+\.\d+.\d+ \d+:\d+)' --csss-date-fmt  '%d.%m.%y %H:%M' --title-regex '(.+\S)\s*-\s*Crusoé\s*$' --author-from-csss 'span.autor-info span' --no-cookies https://crusoe.com.br/
newslinkrss -n 30 -t 2 --follow --with-body --max-page-length 256 -p '^https://www.migalhas.com.br/(\w+/)+[0-9]+/.+' --body-xpath "//article" --require-dates -X '//app-compartilhamento-topo'  --title-regex '(.+)\s+-\s+Migalhas' https://www.migalhas.com.br/

Universidades

newslinkrss -n 100 -t 20 -T 'UDESC Joinville' -a '.*(\d{2}/\d{2}/\d{4}-\d{2}h\d{2}).*' --text-date-fmt '%d/%m/%Y-%Hh%M' -p '.+/cct/noticia/.+' https://www.udesc.br/cct/noticias

Entidades governamentais

newslinkrss -p 'https://www.jaraguadosul.sc.gov.br/news/.+' --http-timeout 10 --follow --with-body --body-csss 'div#area_impressao' --date-from-csss 'small.text-muted > b' https://www.jaraguadosul.sc.gov.br/noticias.php
newslinkrss -t 5 -p 'https://www.jaraguadosul.sc.leg.br/(destaques|geral)/.+' -fB --body-csss '.elementor-widget-theme-post-content' --title-regex '(.*\S)\s*-[^-]+$' https://www.jaraguadosul.sc.leg.br/  https://www.jaraguadosul.sc.leg.br/publicacoes/destaques/ https://www.jaraguadosul.sc.leg.br/geral/
newslinkrss -t 5 -p 'https://www.timbo.sc.gov.br/[a-z]+/20\d\d/.+/' --follow --with-body --body-csss article --title-from-csss 'article h1' --date-from-xpath '//article//time[@datetime]/@datetime' --categories-from-csss 'article ul li.entry-category a' -C 'div[role="complementary"], div.td-post-header, footer, div.td_block_related_posts, div#comments' https://www.timbo.sc.gov.br/noticias
newslinkrss -t 5 -p '^https://estado.sc.gov.br/noticias/[^/]+/?$' --follow --with-body --body-csss article.post -C '.addtoany_content' -i 'https://estado.sc.gov.br/noticias/todos-os-videos-da-tvsecom/?' -i 'https://estado.sc.gov.br/noticias/todos-os-audios-da-radio/?' -i 'https://estado.sc.gov.br/noticias/todas-as-noticias/?' -i 'https://estado.sc.gov.br/noticias/lista-de-assessores?/?' -i 'https://estado.sc.gov.br/noticias/transparencia/?' -i 'https://estado.sc.gov.br/noticias/todos-os-videos-da-tvsecom/?'   https://estado.sc.gov.br/noticias/ https://estado.sc.gov.br/noticias/todas-as-noticias/  https://estado.sc.gov.br/noticias/todas-as-noticias/page/2/ https://estado.sc.gov.br/noticias/todas-as-noticias/page/3/
newslinkrss -p '^https://www.gov.br/secom/pt-br/fatos/brasil-contra-fake/noticias/.+' --follow --with-body  --body-xpath '//article' --date-from-csss 'span.documentPublished span.value, span.documentModified span.value' --csss-date-fmt '%d/%m/%Y %Hh%M' -C 'div.social-links' --title-regex '(.+) — '  https://www.gov.br/secom/pt-br/fatos/brasil-contra-fake/noticias?b_size=60
newslinkrss -p '^https://www.gov.br/anatel/pt-br/assuntos/noticias/.+' --follow --with-body  --body-xpath '//article' --date-from-csss 'span.documentPublished span.value, span.documentModified span.value' --csss-date-fmt '%d/%m/%Y %Hh%M' -C 'div.social-links' --title-regex '(.+) — '  https://www.gov.br/anatel/pt-br/assuntos/noticias?b_size=40
newslinkrss -p '^https://www.gov.br/anpd/pt-br/assuntos/noticias/.+' --follow --with-body  --body-xpath '//article' --date-from-csss 'span.documentPublished span.value' --csss-date-fmt '%d/%m/%Y %Hh%M' -C 'div.social-links'  --title-regex '(.+) — '  https://www.gov.br/anpd/pt-br/assuntos/noticias
newslinkrss -t 10 --follow -p '^https://butantan.gov.br/noticias/.+' --max-page-length 2048 --with-body --body-xpath '//h2/..' --date-from-csss 'small' --csss-date-regex '\s*Publicado em:\s*(\d+/\d+/\d+)\s*' --csss-date-fmt '%d/%m/%Y' -C 'style'  https://butantan.gov.br/noticias/
newslinkrss -p 'https://www.tjsc.jus.br/web/imprensa/-/' --follow --with-body --body-csss '.journal-content-article' --date-from-csss '.tjsc-asset-publisher-list-asset-entry-date-time' --csss-date-fmt '%d %B %Y | %Hh%Mmin' -Q 'redirect' --title-regex '(.+) +- Imprensa' --locale 'pt_BR.UTF-8' https://www.tjsc.jus.br/web/imprensa/noticias
newslinkrss -t 4 --follow -p 'https://www.mpf.mp.br/.+/noticias-.+/.+' -B --body-csss 'div#content' https://www.mpf.mp.br/sala-de-imprensa/noticias
newslinkrss -t 10 --follow -p 'https://www.mpf.mp.br/.+/noticias-.+/.+' -B --body-csss 'div#content' https://www.mpf.mp.br/sc/sala-de-imprensa

Cultura em geral

newslinkrss -p 'https://scar.art.br/eventos/.+' --follow --with-body --body-xpath '//main' https://scar.art.br/evento/
newslinkrss  --follow -p 'https://www.academia.org.br/noticias/.*'  --with-body --body-xpath '(//*[@id="main-content"])/..' --title-regex '^([^|]+)\s+|'  https://www.academia.org.br/noticias/
newslinkrss  --follow -p 'https://www.academia.org.br/nossa-lingua/nova-palavra/.+' --with-body --body-xpath '(//*[@id="main-content"])/..'  https://www.academia.org.br/nossa-lingua/sobre-novas-palavras
newslinkrss -p '^https://www.estadao.com.br/cultura/.+/.+' -t 4 --follow --with-body --body-csss "header h1, header h2, div.informs, #content .content" -C ".ads-placeholder-label, #social-media-lower, .share-container" --date-from-csss 'time' --csss-date-regex '(\d+/\d+/\d+)' --csss-date-fmt '%d/%m/%Y' --title-regex '(.+) - Estadão' --author-from-csss '.informs .names a' --encoding utf-8 https://www.estadao.com.br/cultura/
newslinkrss  -n 30 -f -B -p '^https://www.omelete.com.br/.+/.+' --max-page-length 256 --require-dates --body-csss 'div.article__body' https://www.omelete.com.br/noticias

Outros

newslinkrss -p 'https://aeroin.net/[^/]+(-[^/]+){3,}/?$' -fB --body-csss 'article .td-post-content' -Q 'amp' -C 'i-amphtml-sizer, style' -C .td-post-sharing --author-from-xpath '//meta[@name="author"]/@content' https://aeroin.net/
newslinkrss  -p '^https://idec.org.br/.+/.+' --follow --with-body --body-csss '#main-content header, div.datapublicacao, div.field-name-field-linha-fina, div#content div.field-name-body div.field-item' --date-from-csss 'div.field-name-changed-date div.field-item, div.field-name-post-date div.field-item' --csss-date-fmt '%d/%m/%Y' --require-dates --title-regex '^([^|]+)\s*|' https://idec.org.br/noticias https://idec.org.br/artigos