summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorSteve George <steve@futurile.net>2024-04-26 13:42:00 +0200
committerLudovic Courtès <ludo@gnu.org>2024-05-04 19:14:26 +0200
commit421372c4cdde4b86fab8fb18c90f055d49a4c7bd (patch)
treefbd3d4415903308fd31055d4a02ffa34c9f22b16
parentf2d83b3352559181eea71b45e109286d61a79925 (diff)
downloadguix-patches-421372c4cdde4b86fab8fb18c90f055d49a4c7bd.tar
guix-patches-421372c4cdde4b86fab8fb18c90f055d49a4c7bd.tar.gz
gnu: Add perl-web-scraper.
* gnu/packages/web.scm (perl-web-scraper): New variable.

Change-Id: I3d0a476ca6c09bc20391303f99b260410f16de65
Signed-off-by: Ludovic Courtès <ludo@gnu.org>
-rw-r--r--gnu/packages/web.scm32
1 files changed, 32 insertions, 0 deletions
diff --git a/gnu/packages/web.scm b/gnu/packages/web.scm
index c3ef146750..80f281b4e6 100644
--- a/gnu/packages/web.scm
+++ b/gnu/packages/web.scm
@@ -4778,6 +4778,38 @@ URI::Find::Schemeless. For a command-line interface, urifind is provided.")
methods for WebSocket URIs as it does for HTTP URIs.")
(license license:perl-license)))
+;; Package definition for the Perl module Web::Scraper, fetched from the CPAN
+;; mirror and built with perl-build-system.
+(define-public perl-web-scraper
+  (package
+    (name "perl-web-scraper")
+    (version "0.38")
+    (source
+     (origin
+       (method url-fetch)
+       ;; The tarball file name embeds VERSION, so changing the version field
+       ;; changes the URL; the sha256 below pins the content of that tarball
+       ;; and has to be refreshed together with the version.
+       (uri (string-append "mirror://cpan/authors/id/M/MI/MIYAGAWA/Web-Scraper-"
+                           version ".tar.gz"))
+       (sha256
+        (base32 "1gs3fmbc83j34c0sig1hkpnm26ngnyi5kgq5dl8vxvkzimgnwnzr"))))
+    (build-system perl-build-system)
+    ;; Native inputs: the build tool and test helpers, used while building
+    ;; the package rather than by its users.
+    (native-inputs (list perl-module-build-tiny
+                         perl-test-base
+                         perl-test-requires))
+    ;; Propagated inputs: Perl modules that get installed alongside this
+    ;; package so they are available wherever it is used.
+    (propagated-inputs (list perl-html-parser
+                             perl-html-selector-xpath
+                             perl-html-tagset
+                             perl-html-tree
+                             perl-html-treebuilder-xpath
+                             perl-libwww
+                             perl-universal-require
+                             perl-uri
+                             perl-xml-xpathengine
+                             perl-yaml))
+    (home-page "https://metacpan.org/release/Web-Scraper")
+    (synopsis
+     "Web Scraping toolkit using HTML and CSS Selectors or XPath expressions")
+    ;; The second line of the string starts at column 0 on purpose: any
+    ;; leading whitespace there would become part of the description text.
+    (description "Perl module @code{Web::Scraper} is a toolkit for
+traversing and scraping sites, inspired by Ruby's Scrapi.")
+    (license license:perl-license)))
+
(define-public perl-uri-template
(package
(name "perl-uri-template")