blob: 71a1863f89c3badea54b2103ae169a142917409d (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
|
%global _empty_manifest_terminate_build 0
Name: python-trafilatura
Version: 1.5.0
Release: 1
# Summary is kept to a single short line; the full text lives in the description below.
Summary: Python package and command-line tool to gather text on the Web
License: GPLv3+
URL: https://trafilatura.readthedocs.io
Source0: https://mirrors.nju.edu.cn/pypi/web/packages/d8/aa/5e4f48ecbd5399ff0e3b452fa7befeb7d21060c698ebc71409fd3ad79e18/trafilatura-1.5.0.tar.gz
BuildArch: noarch
# NOTE(review): these Requires tags attach to the main package, and no files
# section for the main package is visible in this spec; confirm whether they
# are meant to apply to the python3 subpackage instead.
Requires: python3-certifi
Requires: python3-courlan
Requires: python3-htmldate
Requires: python3-justext
Requires: python3-lxml
Requires: python3-urllib3
Requires: python3-charset-normalizer
Requires: python3-brotli
# The pip extras form "python3-htmldate[speed]" was dropped here: it is not an
# RPM package name, and the base python3-htmldate package is already required above.
Requires: python3-py3langid
Requires: python3-pycurl
# NOTE(review): cchardet and faust-cchardet look like alternative providers of
# the same functionality; confirm that both are really needed together.
Requires: python3-cchardet
Requires: python3-faust-cchardet
Requires: python3-Gooey
%description
Python package and command-line tool designed to gather text on the Web.
It includes discovery, extraction and text processing components. Its main
applications are web crawling, downloads, scraping, and extraction of main
texts, metadata and comments.

%package -n python3-trafilatura
# Summary is kept to a single short line; the full text lives in the description below.
Summary: Python package and command-line tool to gather text on the Web
Provides: python-trafilatura
# Build-time tooling needed by the build and install steps of this spec.
BuildRequires: python3-devel
BuildRequires: python3-setuptools
BuildRequires: python3-pip
%description -n python3-trafilatura
Python package and command-line tool designed to gather text on the Web.
It includes discovery, extraction and text processing components. Its main
applications are web crawling, downloads, scraping, and extraction of main
texts, metadata and comments.

%package help
Summary: Development documents and examples for trafilatura
Provides: python3-trafilatura-doc
%description help
Development documents and examples for trafilatura.

%prep
# Unpack the upstream tarball. The directory name is derived from the Version
# tag so that a version bump does not require editing this line as well.
%autosetup -n trafilatura-%{version}
%build
# Build the Python 3 package with the distribution's standard build macro.
%py3_build
%install
%py3_install
# Copy whichever upstream documentation and example directories exist into
# the package documentation directory.
install -d -m755 %{buildroot}/%{_pkgdocdir}
for docdir in doc docs example examples; do
    if [ -d "$docdir" ]; then cp -arf "$docdir" %{buildroot}/%{_pkgdocdir}; fi
done
pushd %{buildroot}
# Create both manifests up front so the mv commands below cannot fail when a
# directory tree is absent.
touch filelist.lst doclist.lst
# Record every installed regular file under the library and binary trees.
# The printf directives are written with doubled percent signs so rpm passes a
# literal percent sign to find, and each path is double-quoted so that file
# names containing whitespace remain a single manifest entry.
for tree in usr/lib usr/lib64 usr/bin usr/sbin; do
    if [ -d "$tree" ]; then
        find "$tree" -type f -printf "\"/%%h/%%f\"\n" >> filelist.lst
    fi
done
# Manual pages are listed with a .gz suffix.
# NOTE(review): this presumes the build root policy gzip-compresses man pages
# after this section runs; confirm for the target distribution.
if [ -d usr/share/man ]; then
    find usr/share/man -type f -printf "\"/%%h/%%f.gz\"\n" >> doclist.lst
fi
popd
# Move the manifests out of the build root so they are not packaged themselves.
mv %{buildroot}/filelist.lst .
mv %{buildroot}/doclist.lst .
%files -n python3-trafilatura -f filelist.lst
# Runtime package: the files recorded in filelist.lst during install, plus the
# top-level entries under the Python 3 site library path declared as directories.
%dir %{python3_sitelib}/*
%files help -f doclist.lst
# Help package: the entries recorded in doclist.lst during install, plus
# everything installed under the documentation directory.
%{_docdir}/*
%changelog
* Mon Apr 10 2023 Python_Bot <Python_Bot@openeuler.org> - 1.5.0-1
- Package Spec generated
|