diff options
author | Steve George <steve@futurile.net> | 2024-04-26 13:42:00 +0200 |
---|---|---|
committer | Ludovic Courtès <ludo@gnu.org> | 2024-05-04 19:14:26 +0200 |
commit | 421372c4cdde4b86fab8fb18c90f055d49a4c7bd (patch) | |
tree | fbd3d4415903308fd31055d4a02ffa34c9f22b16 /gnu/packages/web.scm | |
parent | f2d83b3352559181eea71b45e109286d61a79925 (diff) |
gnu: Add perl-web-scraper.
* gnu/packages/web.scm (perl-web-scraper): New variable.
Change-Id: I3d0a476ca6c09bc20391303f99b260410f16de65
Signed-off-by: Ludovic Courtès <ludo@gnu.org>
Diffstat (limited to 'gnu/packages/web.scm')
-rw-r--r-- | gnu/packages/web.scm | 32 |
1 files changed, 32 insertions, 0 deletions
diff --git a/gnu/packages/web.scm b/gnu/packages/web.scm
index c3ef146750..80f281b4e6 100644
--- a/gnu/packages/web.scm
+++ b/gnu/packages/web.scm
@@ -4778,6 +4778,38 @@ URI::Find::Schemeless. For a command-line interface, urifind is provided.")
 methods for WebSocket URIs as it does for HTTP URIs.")
     (license license:perl-license)))
 
+(define-public perl-web-scraper
+  (package
+    (name "perl-web-scraper")
+    (version "0.38")
+    (source
+     (origin
+       (method url-fetch)
+       (uri (string-append "mirror://cpan/authors/id/M/MI/MIYAGAWA/Web-Scraper-"
+                           version ".tar.gz"))
+       (sha256
+        (base32 "1gs3fmbc83j34c0sig1hkpnm26ngnyi5kgq5dl8vxvkzimgnwnzr"))))
+    (build-system perl-build-system)
+    (native-inputs (list perl-module-build-tiny      ;build- and test-time only
+                         perl-test-base
+                         perl-test-requires))
+    (propagated-inputs (list perl-html-parser        ;run-time dependencies
+                             perl-html-selector-xpath
+                             perl-html-tagset
+                             perl-html-tree
+                             perl-html-treebuilder-xpath
+                             perl-libwww
+                             perl-universal-require
+                             perl-uri
+                             perl-xml-xpathengine
+                             perl-yaml))
+    (home-page "https://metacpan.org/release/Web-Scraper")
+    (synopsis
+     "Web scraping toolkit using HTML and CSS selectors or XPath expressions")
+    (description "Perl module @code{Web::Scraper} is a toolkit for
+traversing and scraping sites, inspired by Ruby's Scrapi.")
+    (license license:perl-license)))
+
 (define-public perl-uri-template
   (package
     (name "perl-uri-template")