summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorCoprDistGit <infra@openeuler.org>2023-05-17 03:43:08 +0000
committerCoprDistGit <infra@openeuler.org>2023-05-17 03:43:08 +0000
commitdad53eb8ce6a0f27f584144aba5cf63cc9d67e21 (patch)
tree2f3c1ed178a1925c1985b7bf5e91420e28fb271d
parent9cbde80239c3409242ba421f7986d34caf7ef55a (diff)
automatic import of python-brozzler
-rw-r--r--.gitignore1
-rw-r--r--python-brozzler.spec90
-rw-r--r--sources1
3 files changed, 92 insertions, 0 deletions
diff --git a/.gitignore b/.gitignore
index e69de29..82cac7b 100644
--- a/.gitignore
+++ b/.gitignore
@@ -0,0 +1 @@
+/brozzler-1.5.18.tar.gz
diff --git a/python-brozzler.spec b/python-brozzler.spec
new file mode 100644
index 0000000..aeb73c8
--- /dev/null
+++ b/python-brozzler.spec
@@ -0,0 +1,90 @@
+%global _empty_manifest_terminate_build 0
+Name: python-brozzler
+Version: 1.5.18
+Release: 1
+Summary: Distributed web crawling with browsers
+License: Apache License 2.0
+URL: https://github.com/internetarchive/brozzler
+Source0: https://mirrors.nju.edu.cn/pypi/web/packages/b9/9e/7fa23d061f1dcbbe659740a675bff85804d715ce552ae7a3780e27c81537/brozzler-1.5.18.tar.gz
+BuildArch: noarch
+
+
+%description
+"browser" \| "crawler" = "brozzler"
+Brozzler is a distributed web crawler (爬虫) that uses a real browser (Chrome
+or Chromium) to fetch pages and embedded URLs and to extract links. It employs
+`youtube-dl <https://github.com/rg3/youtube-dl>`_ to enhance media capture
+capabilities and `rethinkdb <https://github.com/rethinkdb/rethinkdb>`_ to
+manage crawl state.
+Brozzler is designed to work in conjunction with warcprox for web archiving.
+
+%package -n python3-brozzler
+Summary: Distributed web crawling with browsers
+Provides: python-brozzler
+BuildRequires: python3-devel
+BuildRequires: python3-setuptools
+BuildRequires: python3-pip
+%description -n python3-brozzler
+"browser" \| "crawler" = "brozzler"
+Brozzler is a distributed web crawler (爬虫) that uses a real browser (Chrome
+or Chromium) to fetch pages and embedded URLs and to extract links. It employs
+`youtube-dl <https://github.com/rg3/youtube-dl>`_ to enhance media capture
+capabilities and `rethinkdb <https://github.com/rethinkdb/rethinkdb>`_ to
+manage crawl state.
+Brozzler is designed to work in conjunction with warcprox for web archiving.
+
+%package help
+Summary: Development documents and examples for brozzler
+Provides: python3-brozzler-doc
+%description help
+"browser" \| "crawler" = "brozzler"
+Brozzler is a distributed web crawler (爬虫) that uses a real browser (Chrome
+or Chromium) to fetch pages and embedded URLs and to extract links. It employs
+`youtube-dl <https://github.com/rg3/youtube-dl>`_ to enhance media capture
+capabilities and `rethinkdb <https://github.com/rethinkdb/rethinkdb>`_ to
+manage crawl state.
+Brozzler is designed to work in conjunction with warcprox for web archiving.
+
+%prep
+%autosetup -n brozzler-1.5.18
+
+%build
+%py3_build
+
+%install
+%py3_install
+# Stage whichever upstream documentation/example directories exist.
+install -d -m755 %{buildroot}%{_pkgdocdir}
+for d in doc docs example examples; do
+ if [ -d "$d" ]; then cp -arf "$d" %{buildroot}%{_pkgdocdir}; fi
+done
+# Build the manifests consumed by the files sections via -f. Paths are
+# written relative to the buildroot with a leading slash, and wrapped in
+# double quotes so that names containing spaces stay a single entry.
+pushd %{buildroot}
+# Create both manifests up front so the mv calls below cannot fail when
+# a directory is absent and find never runs.
+touch filelist.lst doclist.lst
+for d in usr/lib usr/lib64 usr/bin usr/sbin; do
+ if [ -d "$d" ]; then
+  find "$d" -type f -printf "\"/%h/%f\"\n" >> filelist.lst
+ fi
+done
+# Man pages are listed with a .gz suffix; presumably they are compressed
+# by a later build step before packaging (TODO confirm).
+if [ -d usr/share/man ]; then
+ find usr/share/man -type f -printf "\"/%h/%f.gz\"\n" >> doclist.lst
+fi
+popd
+mv %{buildroot}/filelist.lst .
+mv %{buildroot}/doclist.lst .
+
+%files -n python3-brozzler -f filelist.lst
+%dir %{python3_sitelib}/*
+
+%files help -f doclist.lst
+%{_docdir}/*
+
+%changelog
+* Wed May 17 2023 Python_Bot <Python_Bot@openeuler.org> - 1.5.18-1
+- Package Spec generated
diff --git a/sources b/sources
new file mode 100644
index 0000000..61f828a
--- /dev/null
+++ b/sources
@@ -0,0 +1 @@
+92bcda2a5389bfc7939568e5bc1c4801 brozzler-1.5.18.tar.gz