Compare commits
100 Commits
Author | SHA1 | Date |
---|---|---|
tastytea | 449e315397 | |
tastytea | 7eae29031f | |
tastytea | 531a409124 | |
tastytea | 22a50ef661 | |
tastytea | 94555621d8 | |
tastytea | cfe274f1e1 | |
tastytea | eb4630d738 | |
tastytea | bbc412db45 | |
tastytea | c0a2f7e779 | |
tastytea | 4b5e6898cd | |
tastytea | c16265683f | |
tastytea | d438e2292f | |
tastytea | 089eac4cfc | |
tastytea | 63a8ab2683 | |
tastytea | cd03898039 | |
tastytea | 550a1143a5 | |
tastytea | d1083b7dca | |
tastytea | 1058903def | |
tastytea | 5d28b1f4ef | |
tastytea | bb37e53207 | |
tastytea | 1bddad7083 | |
tastytea | 7daade6425 | |
tastytea | c41f3a2485 | |
tastytea | 3e23dc2cd9 | |
tastytea | 9c6dd5ca64 | |
tastytea | c62799e00f | |
tastytea | 636e84408c | |
tastytea | ef77a9e4fb | |
tastytea | 552df1a49e | |
tastytea | 1e0cde8a4b | |
tastytea | 2bede91fb7 | |
tastytea | 165592982a | |
tastytea | b1dcdea95e | |
tastytea | 299063e02c | |
tastytea | fca719634a | |
tastytea | d2aff45018 | |
tastytea | b134bd0301 | |
tastytea | d0738891c2 | |
tastytea | b53e99306c | |
tastytea | 84ef5d1bf3 | |
tastytea | 97fecd37f0 | |
tastytea | e154b62201 | |
tastytea | 90eb30fa3e | |
tastytea | 9cc1823b3b | |
tastytea | 2489c444df | |
tastytea | c99c01162d | |
tastytea | 49de44f729 | |
tastytea | bdcf153b47 | |
tastytea | 57c87ca5e7 | |
tastytea | 5c0ca46c9d | |
tastytea | 691dea092d | |
tastytea | 07ec6f789f | |
tastytea | 979dc9334c | |
tastytea | 961deff41d | |
tastytea | 1cf6306f4b | |
tastytea | 822bff1955 | |
tastytea | 18c3d8f58d | |
tastytea | b2a6f9217b | |
tastytea | babd7e4f61 | |
tastytea | ed86f3a56d | |
tastytea | f8270369b6 | |
tastytea | 3966b99c3f | |
tastytea | 37c2fe1bb1 | |
tastytea | a77b90c8b1 | |
tastytea | 42e5e52e1b | |
tastytea | 1eb763fc37 | |
tastytea | 633274e3dd | |
tastytea | 51f8422929 | |
tastytea | 8b5c0d289e | |
tastytea | 7b817c42d1 | |
tastytea | be4d8aecd0 | |
tastytea | 1c8279f96f | |
tastytea | f59c86e20d | |
tastytea | 0470acb00e | |
tastytea | 1e29608c7e | |
tastytea | 5e89a71e00 | |
tastytea | 9708bb69c8 | |
tastytea | b8431019b7 | |
tastytea | ebb8b63830 | |
tastytea | a49c500d0f | |
tastytea | 262aab6671 | |
tastytea | 9067b387ef | |
tastytea | 99e1cd8e98 | |
tastytea | bdf9a86651 | |
tastytea | f1a0015f28 | |
tastytea | fbf86f51d1 | |
tastytea | 12e1c64fc0 | |
tastytea | 4026937f08 | |
tastytea | cb2aee847f | |
tastytea | 4b09158037 | |
tastytea | 226b66b77b | |
tastytea | 92b8281242 | |
tastytea | 2b51229518 | |
tastytea | bc34a3a515 | |
tastytea | 85a00bb23c | |
tastytea | d83f485fb4 | |
tastytea | 7252463fbb | |
tastytea | 7d8cf7de91 | |
tastytea | 5af10f6767 | |
tastytea | d1c74d244d |
15
.clang-tidy
15
.clang-tidy
|
@ -1,5 +1,4 @@
|
||||||
# -*- mode: conf; fill-column: 100; -*-
|
# Written for clang-tidy 14.
|
||||||
# Written for clang-tidy 11.
|
|
||||||
|
|
||||||
---
|
---
|
||||||
Checks: '*,
|
Checks: '*,
|
||||||
|
@ -29,7 +28,9 @@ Checks: '*,
|
||||||
-fuchsia-multiple-inheritance,
|
-fuchsia-multiple-inheritance,
|
||||||
-llvmlibc*,
|
-llvmlibc*,
|
||||||
-cppcoreguidelines-avoid-non-const-global-variables,
|
-cppcoreguidelines-avoid-non-const-global-variables,
|
||||||
-cert-*-c'
|
-cert-*-c,
|
||||||
|
-abseil-string-find-*,
|
||||||
|
-altera-*'
|
||||||
FormatStyle: file # Use .clang-format.
|
FormatStyle: file # Use .clang-format.
|
||||||
CheckOptions: # ↓ Clashes with static private member prefix. (static int _var;) ↓
|
CheckOptions: # ↓ Clashes with static private member prefix. (static int _var;) ↓
|
||||||
- { key: readability-identifier-naming.VariableCase, value: lower_case }
|
- { key: readability-identifier-naming.VariableCase, value: lower_case }
|
||||||
|
@ -39,9 +40,15 @@ CheckOptions: # ↓ Clashes with static private member prefix. (static int _va
|
||||||
- { key: readability-identifier-naming.ProtectedMemberCase, value: lower_case }
|
- { key: readability-identifier-naming.ProtectedMemberCase, value: lower_case }
|
||||||
- { key: readability-identifier-naming.ProtectedMemberPrefix, value: _ }
|
- { key: readability-identifier-naming.ProtectedMemberPrefix, value: _ }
|
||||||
|
|
||||||
- { key: readability-identifier-naming.ClassCase, value: lower_case }
|
- { key: readability-identifier-naming.ClassCase, value: lower_case }
|
||||||
- { key: readability-identifier-naming.StructCase, value: lower_case }
|
- { key: readability-identifier-naming.StructCase, value: lower_case }
|
||||||
- { key: readability-identifier-naming.EnumCase, value: lower_case }
|
- { key: readability-identifier-naming.EnumCase, value: lower_case }
|
||||||
- { key: readability-identifier-naming.FunctionCase, value: lower_case }
|
- { key: readability-identifier-naming.FunctionCase, value: lower_case }
|
||||||
- { key: readability-identifier-naming.ParameterCase, value: lower_case }
|
- { key: readability-identifier-naming.ParameterCase, value: lower_case }
|
||||||
|
|
||||||
|
- { key: readability-function-cognitive-complexity.Threshold, value: 30 }
|
||||||
|
- { key: readability-identifier-length.MinimumVariableNameLength, value: 2 }
|
||||||
...
|
...
|
||||||
|
|
||||||
|
# -*- mode: yaml; fill-column: 100; -*-
|
||||||
|
# vim: set fenc=utf-8 tw=100 et ft=yaml:
|
||||||
|
|
|
@ -0,0 +1,5 @@
|
||||||
|
{
|
||||||
|
"format": {
|
||||||
|
"disable": true
|
||||||
|
}
|
||||||
|
}
|
166
.drone.yml
166
.drone.yml
|
@ -4,9 +4,12 @@ kind: pipeline
|
||||||
type: docker
|
type: docker
|
||||||
|
|
||||||
volumes:
|
volumes:
|
||||||
- name: debian-package-cache
|
- name: deb-package-cache
|
||||||
host:
|
host:
|
||||||
path: /var/cache/debian-package-cache
|
path: /var/cache/deb-package-cache
|
||||||
|
- name: rpm-package-cache
|
||||||
|
host:
|
||||||
|
path: /var/cache/rpm-package-cache
|
||||||
|
|
||||||
trigger:
|
trigger:
|
||||||
event:
|
event:
|
||||||
|
@ -14,7 +17,7 @@ trigger:
|
||||||
- tag
|
- tag
|
||||||
|
|
||||||
steps:
|
steps:
|
||||||
- name: GCC 10 / clang 11
|
- name: GCC 10 / clang 11 (debug)
|
||||||
image: debian:bullseye-slim
|
image: debian:bullseye-slim
|
||||||
pull: always
|
pull: always
|
||||||
environment:
|
environment:
|
||||||
|
@ -28,19 +31,19 @@ steps:
|
||||||
- apt-get update -q
|
- apt-get update -q
|
||||||
- apt-get install -qq build-essential cmake clang locales
|
- apt-get install -qq build-essential cmake clang locales
|
||||||
- apt-get install -qq catch libboost-program-options-dev libboost-locale-dev libboost-regex-dev libboost-log-dev gettext libarchive-dev libfmt-dev asciidoc libpugixml-dev nlohmann-json3-dev
|
- apt-get install -qq catch libboost-program-options-dev libboost-locale-dev libboost-regex-dev libboost-log-dev gettext libarchive-dev libfmt-dev asciidoc libpugixml-dev nlohmann-json3-dev
|
||||||
- rm -rf build && mkdir -p build && cd build
|
- rm -rf build_deb && mkdir -p build_deb && cd build_deb
|
||||||
- cmake -G "Unix Makefiles" -DWITH_TESTS=YES ..
|
- cmake -DCMAKE_BUILD_TYPE=Debug -G "Unix Makefiles" -DWITH_TESTS=YES -DWITH_SANITIZERS=YES ..
|
||||||
- make VERBOSE=1
|
- make VERBOSE=1
|
||||||
- make install DESTDIR=install
|
- make install DESTDIR=install
|
||||||
- cd tests && ctest -V
|
- ctest -V
|
||||||
- cd ../../
|
- cd ../
|
||||||
- rm -rf build && mkdir -p build && cd build
|
- rm -rf build_deb && mkdir -p build_deb && cd build_deb
|
||||||
- CXX="clang++" cmake -G "Unix Makefiles" -DWITH_TESTS=YES ..
|
- CXX="clang++" cmake -DCMAKE_BUILD_TYPE=Debug -G "Unix Makefiles" -DWITH_TESTS=YES -DWITH_SANITIZERS=YES ..
|
||||||
- make VERBOSE=1
|
- make VERBOSE=1
|
||||||
- make install DESTDIR=install
|
- make install DESTDIR=install
|
||||||
- cd tests && ctest -V
|
- ctest -V
|
||||||
volumes:
|
volumes:
|
||||||
- name: debian-package-cache
|
- name: deb-package-cache
|
||||||
path: /var/cache/apt/archives
|
path: /var/cache/apt/archives
|
||||||
|
|
||||||
- name: Download CMake 3.12 installer
|
- name: Download CMake 3.12 installer
|
||||||
|
@ -69,20 +72,43 @@ steps:
|
||||||
- apt-get install -qq catch libboost-program-options-dev libboost-locale-dev libboost-regex-dev libboost-log-dev gettext libarchive-dev libfmt-dev asciidoc libpugixml-dev nlohmann-json-dev
|
- apt-get install -qq catch libboost-program-options-dev libboost-locale-dev libboost-regex-dev libboost-log-dev gettext libarchive-dev libfmt-dev asciidoc libpugixml-dev nlohmann-json-dev
|
||||||
- sh cmake_installer.sh --skip-license --exclude-subdir --prefix=/usr/local
|
- sh cmake_installer.sh --skip-license --exclude-subdir --prefix=/usr/local
|
||||||
- cp /usr/lib/x86_64-linux-gnu/libpugixml* /lib/x86_64-linux-gnu/
|
- cp /usr/lib/x86_64-linux-gnu/libpugixml* /lib/x86_64-linux-gnu/
|
||||||
- rm -rf build && mkdir -p build && cd build
|
- rm -rf build_deb && mkdir -p build_deb && cd build_deb
|
||||||
- cmake -G "Unix Makefiles" -DWITH_TESTS=YES ..
|
- cmake -G "Unix Makefiles" -DWITH_TESTS=YES ..
|
||||||
- make VERBOSE=1
|
- make VERBOSE=1
|
||||||
- make install DESTDIR=install
|
- make install DESTDIR=install
|
||||||
- cd tests && ctest -V
|
- ctest -V
|
||||||
- cd ../../
|
- cd ../
|
||||||
- rm -rf build && mkdir -p build && cd build
|
- rm -rf build_deb && mkdir -p build_deb && cd build_deb
|
||||||
- CXX="clang++" cmake -G "Unix Makefiles" -DWITH_TESTS=YES ..
|
- CXX="clang++" cmake -G "Unix Makefiles" -DWITH_TESTS=YES ..
|
||||||
- make VERBOSE=1
|
- make VERBOSE=1
|
||||||
- make install DESTDIR=install
|
- make install DESTDIR=install
|
||||||
- cd tests && ctest -V
|
- ctest -V
|
||||||
volumes:
|
volumes:
|
||||||
- name: debian-package-cache
|
- name: deb-package-cache
|
||||||
path: /var/cache/apt/archives
|
path: /var/cache/apt/archives
|
||||||
|
depends_on:
|
||||||
|
- GCC 10 / clang 11 (debug)
|
||||||
|
- Download CMake 3.12 installer
|
||||||
|
|
||||||
|
- name: GCC 9
|
||||||
|
image: opensuse/leap:15
|
||||||
|
pull: always
|
||||||
|
environment:
|
||||||
|
CXX: g++-9
|
||||||
|
CXXFLAGS: -pipe -O2
|
||||||
|
LANG: C.UTF-8
|
||||||
|
commands:
|
||||||
|
- zypper --non-interactive modifyrepo --all --keep-packages
|
||||||
|
- zypper --non-interactive install cmake gcc9-c++ rpm-build
|
||||||
|
- zypper --non-interactive install Catch2-devel libboost_program_options1_75_0-devel libboost_locale1_75_0-devel libboost_log1_75_0-devel fmt-devel libarchive-devel pugixml-devel nlohmann_json-devel asciidoc
|
||||||
|
- rm -rf build_rpm && mkdir -p build_rpm && cd build_rpm
|
||||||
|
- cmake -G "Unix Makefiles" -DWITH_TESTS=YES ..
|
||||||
|
- make VERBOSE=1
|
||||||
|
- make install DESTDIR=install
|
||||||
|
- ctest -V
|
||||||
|
volumes:
|
||||||
|
- name: rpm-package-cache
|
||||||
|
path: /var/cache/zypp/packages
|
||||||
|
|
||||||
- name: notify
|
- name: notify
|
||||||
image: drillster/drone-email
|
image: drillster/drone-email
|
||||||
|
@ -96,6 +122,11 @@ steps:
|
||||||
from_secret: email_password
|
from_secret: email_password
|
||||||
when:
|
when:
|
||||||
status: [ changed, failure ]
|
status: [ changed, failure ]
|
||||||
|
depends_on:
|
||||||
|
- GCC 10 / clang 11 (debug)
|
||||||
|
- Download CMake 3.12 installer
|
||||||
|
- GCC 9
|
||||||
|
- GCC 8 / clang 6
|
||||||
|
|
||||||
---
|
---
|
||||||
name: Packages x86_64
|
name: Packages x86_64
|
||||||
|
@ -103,15 +134,40 @@ kind: pipeline
|
||||||
type: docker
|
type: docker
|
||||||
|
|
||||||
volumes:
|
volumes:
|
||||||
- name: debian-package-cache
|
- name: deb-package-cache
|
||||||
host:
|
host:
|
||||||
path: /var/cache/debian-package-cache
|
path: /var/cache/deb-package-cache
|
||||||
|
|
||||||
trigger:
|
trigger:
|
||||||
event:
|
event:
|
||||||
- tag
|
- tag
|
||||||
|
|
||||||
steps:
|
steps:
|
||||||
|
- name: Debian bullseye
|
||||||
|
image: debian:bullseye-slim
|
||||||
|
pull: always
|
||||||
|
environment:
|
||||||
|
CXX: g++-10
|
||||||
|
CXXFLAGS: -pipe -O2
|
||||||
|
DEBIAN_FRONTEND: noninteractive
|
||||||
|
LANG: C.UTF-8
|
||||||
|
commands:
|
||||||
|
- rm /etc/apt/apt.conf.d/docker-clean
|
||||||
|
- alias apt-get='rm -f /var/cache/apt/archives/lock && apt-get'
|
||||||
|
- apt-get update -q
|
||||||
|
- apt-get install -qq build-essential cmake clang locales lsb-release file
|
||||||
|
- apt-get install -qq libboost-program-options-dev libboost-locale-dev libboost-regex-dev libboost-log-dev gettext libarchive-dev libfmt-dev libpugixml-dev nlohmann-json3-dev
|
||||||
|
- apt-get install -qq --no-install-recommends asciidoc xsltproc
|
||||||
|
- rm -rf build_deb && mkdir -p build_deb && cd build_deb
|
||||||
|
- cmake -G "Unix Makefiles" -DCMAKE_INSTALL_PREFIX=/usr ..
|
||||||
|
- make VERBOSE=1
|
||||||
|
- make install DESTDIR=install
|
||||||
|
- cpack -G DEB
|
||||||
|
- cp -v epubgrep_${DRONE_TAG}-0_amd64_bullseye.deb ..
|
||||||
|
volumes:
|
||||||
|
- name: deb-package-cache
|
||||||
|
path: /var/cache/apt/archives
|
||||||
|
|
||||||
- name: Debian buster
|
- name: Debian buster
|
||||||
image: debian:buster-slim
|
image: debian:buster-slim
|
||||||
pull: always
|
pull: always
|
||||||
|
@ -125,17 +181,20 @@ steps:
|
||||||
- rm /etc/apt/apt.conf.d/docker-clean
|
- rm /etc/apt/apt.conf.d/docker-clean
|
||||||
- alias apt-get='rm -f /var/cache/apt/archives/lock && apt-get'
|
- alias apt-get='rm -f /var/cache/apt/archives/lock && apt-get'
|
||||||
- apt-get update -q
|
- apt-get update -q
|
||||||
- apt-get install -qq build-essential cmake clang locales lsb-release
|
- apt-get install -qq build-essential cmake clang locales lsb-release file
|
||||||
- apt-get install -qq libboost-program-options-dev libboost-locale-dev libboost-regex-dev libboost-log-dev gettext libarchive-dev libfmt-dev asciidoc libpugixml-dev nlohmann-json-dev
|
- apt-get install -qq libboost-program-options-dev libboost-locale-dev libboost-regex-dev libboost-log-dev gettext libarchive-dev libfmt-dev libpugixml-dev nlohmann-json-dev
|
||||||
- rm -rf build && mkdir -p build && cd build
|
- apt-get install -qq --no-install-recommends asciidoc xsltproc
|
||||||
|
- rm -rf build_deb && mkdir -p build_deb && cd build_deb
|
||||||
- cmake -G "Unix Makefiles" -DCMAKE_INSTALL_PREFIX=/usr ..
|
- cmake -G "Unix Makefiles" -DCMAKE_INSTALL_PREFIX=/usr ..
|
||||||
- make VERBOSE=1
|
- make VERBOSE=1
|
||||||
- make install DESTDIR=install
|
- make install DESTDIR=install
|
||||||
- cpack -G DEB
|
- cpack -G DEB
|
||||||
- cp -v epubgrep_${DRONE_TAG}-0_amd64_buster.deb ..
|
- cp -v epubgrep_${DRONE_TAG}-0_amd64_buster.deb ..
|
||||||
volumes:
|
volumes:
|
||||||
- name: debian-package-cache
|
- name: deb-package-cache
|
||||||
path: /var/cache/apt/archives
|
path: /var/cache/apt/archives
|
||||||
|
depends_on:
|
||||||
|
- Debian bullseye
|
||||||
|
|
||||||
- name: Ubuntu focal
|
- name: Ubuntu focal
|
||||||
image: ubuntu:focal
|
image: ubuntu:focal
|
||||||
|
@ -149,17 +208,21 @@ steps:
|
||||||
- rm /etc/apt/apt.conf.d/docker-clean
|
- rm /etc/apt/apt.conf.d/docker-clean
|
||||||
- alias apt-get='rm -f /var/cache/apt/archives/lock && apt-get'
|
- alias apt-get='rm -f /var/cache/apt/archives/lock && apt-get'
|
||||||
- apt-get update -q
|
- apt-get update -q
|
||||||
- apt-get install -qq build-essential cmake clang locales lsb-release
|
- apt-get install -qq build-essential cmake clang locales lsb-release file
|
||||||
- apt-get install -qq libboost-program-options-dev libboost-locale-dev libboost-regex-dev libboost-log-dev gettext libarchive-dev libfmt-dev asciidoc libpugixml-dev nlohmann-json3-dev
|
- apt-get install -qq libboost-program-options-dev libboost-locale-dev libboost-regex-dev libboost-log-dev gettext libarchive-dev libfmt-dev libpugixml-dev nlohmann-json3-dev
|
||||||
- rm -rf build && mkdir -p build && cd build
|
- apt-get install -qq --no-install-recommends asciidoc xsltproc
|
||||||
|
- rm -rf build_deb && mkdir -p build_deb && cd build_deb
|
||||||
- cmake -G "Unix Makefiles" -DCMAKE_INSTALL_PREFIX=/usr ..
|
- cmake -G "Unix Makefiles" -DCMAKE_INSTALL_PREFIX=/usr ..
|
||||||
- make VERBOSE=1
|
- make VERBOSE=1
|
||||||
- make install DESTDIR=install
|
- make install DESTDIR=install
|
||||||
- cpack -G DEB
|
- cpack -G DEB
|
||||||
- cp -v epubgrep_${DRONE_TAG}-0_amd64_focal.deb ..
|
- cp -v epubgrep_${DRONE_TAG}-0_amd64_focal.deb ..
|
||||||
volumes:
|
volumes:
|
||||||
- name: debian-package-cache
|
- name: deb-package-cache
|
||||||
path: /var/cache/apt/archives
|
path: /var/cache/apt/archives
|
||||||
|
depends_on:
|
||||||
|
- Debian bullseye
|
||||||
|
- Debian buster
|
||||||
|
|
||||||
- name: Download CMake 3.12 installer
|
- name: Download CMake 3.12 installer
|
||||||
image: plugins/download
|
image: plugins/download
|
||||||
|
@ -183,19 +246,46 @@ steps:
|
||||||
- rm /etc/apt/apt.conf.d/docker-clean
|
- rm /etc/apt/apt.conf.d/docker-clean
|
||||||
- alias apt-get='rm -f /var/cache/apt/archives/lock && apt-get'
|
- alias apt-get='rm -f /var/cache/apt/archives/lock && apt-get'
|
||||||
- apt-get update -q
|
- apt-get update -q
|
||||||
- apt-get install -qq g++-8 build-essential clang locales lsb-release
|
- apt-get install -qq g++-8 build-essential clang locales lsb-release file
|
||||||
- apt-get install -qq libboost-program-options-dev libboost-locale-dev libboost-regex-dev libboost-log-dev gettext libarchive-dev libfmt-dev asciidoc libpugixml-dev nlohmann-json-dev
|
- apt-get install -qq libboost-program-options-dev libboost-locale-dev libboost-regex-dev libboost-log-dev gettext libarchive-dev libfmt-dev libpugixml-dev nlohmann-json-dev
|
||||||
|
- apt-get install -qq --no-install-recommends asciidoc xsltproc
|
||||||
- sh cmake_installer.sh --skip-license --exclude-subdir --prefix=/usr/local
|
- sh cmake_installer.sh --skip-license --exclude-subdir --prefix=/usr/local
|
||||||
- cp /usr/lib/x86_64-linux-gnu/libpugixml* /lib/x86_64-linux-gnu/
|
- cp /usr/lib/x86_64-linux-gnu/libpugixml* /lib/x86_64-linux-gnu/
|
||||||
- rm -rf build && mkdir -p build && cd build
|
- rm -rf build_deb && mkdir -p build_deb && cd build_deb
|
||||||
- cmake -G "Unix Makefiles" -DCMAKE_INSTALL_PREFIX=/usr ..
|
- cmake -G "Unix Makefiles" -DCMAKE_INSTALL_PREFIX=/usr ..
|
||||||
- make VERBOSE=1
|
- make VERBOSE=1
|
||||||
- make install DESTDIR=install
|
- make install DESTDIR=install
|
||||||
- cpack -G DEB
|
- cpack -G DEB
|
||||||
- cp -v epubgrep_${DRONE_TAG}-0_amd64_bionic.deb ..
|
- cp -v epubgrep_${DRONE_TAG}-0_amd64_bionic.deb ..
|
||||||
volumes:
|
volumes:
|
||||||
- name: debian-package-cache
|
- name: deb-package-cache
|
||||||
path: /var/cache/apt/archives
|
path: /var/cache/apt/archives
|
||||||
|
depends_on:
|
||||||
|
- Debian bullseye
|
||||||
|
- Debian buster
|
||||||
|
- Ubuntu focal
|
||||||
|
- Download CMake 3.12 installer
|
||||||
|
|
||||||
|
- name: openSUSE Leap 15
|
||||||
|
image: opensuse/leap:15
|
||||||
|
pull: always
|
||||||
|
environment:
|
||||||
|
CXX: g++-9
|
||||||
|
CXXFLAGS: -pipe -O2
|
||||||
|
LANG: C.UTF-8
|
||||||
|
commands:
|
||||||
|
- zypper --non-interactive modifyrepo --all --keep-packages
|
||||||
|
- zypper --non-interactive install cmake gcc9-c++ rpm-build lsb-release
|
||||||
|
- zypper --non-interactive install libboost_program_options1_75_0-devel libboost_locale1_75_0-devel libboost_log1_75_0-devel fmt-devel libarchive-devel pugixml-devel nlohmann_json-devel asciidoc
|
||||||
|
- rm -rf build_rpm && mkdir -p build_rpm && cd build_rpm
|
||||||
|
- cmake -G "Unix Makefiles" -DCMAKE_INSTALL_PREFIX=/usr ..
|
||||||
|
- make VERBOSE=1
|
||||||
|
- make install DESTDIR=install
|
||||||
|
- cpack -G RPM
|
||||||
|
- cp -v epubgrep-${DRONE_TAG}-0.x86_64.opensuse-$(lsb_release --release --short).rpm ..
|
||||||
|
volumes:
|
||||||
|
- name: rpm-package-cache
|
||||||
|
path: /var/cache/zypp/packages
|
||||||
|
|
||||||
- name: gitea_release
|
- name: gitea_release
|
||||||
image: plugins/gitea-release
|
image: plugins/gitea-release
|
||||||
|
@ -208,10 +298,18 @@ steps:
|
||||||
prerelease: true
|
prerelease: true
|
||||||
files:
|
files:
|
||||||
- epubgrep_${DRONE_TAG}-0_amd64_buster.deb
|
- epubgrep_${DRONE_TAG}-0_amd64_buster.deb
|
||||||
|
- epubgrep_${DRONE_TAG}-0_amd64_bullseye.deb
|
||||||
- epubgrep_${DRONE_TAG}-0_amd64_focal.deb
|
- epubgrep_${DRONE_TAG}-0_amd64_focal.deb
|
||||||
- epubgrep_${DRONE_TAG}-0_amd64_bionic.deb
|
- epubgrep_${DRONE_TAG}-0_amd64_bionic.deb
|
||||||
|
- epubgrep-${DRONE_TAG}-0.x86_64.opensuse-$(lsb_release --release --short).rpm
|
||||||
checksum:
|
checksum:
|
||||||
- sha512
|
- sha512
|
||||||
|
depends_on:
|
||||||
|
- Debian bullseye
|
||||||
|
- Debian buster
|
||||||
|
- Ubuntu focal
|
||||||
|
- Ubuntu bionic
|
||||||
|
- openSUSE Leap 15
|
||||||
|
|
||||||
- name: notification
|
- name: notification
|
||||||
image: drillster/drone-email
|
image: drillster/drone-email
|
||||||
|
@ -225,3 +323,9 @@ steps:
|
||||||
from_secret: email_password
|
from_secret: email_password
|
||||||
when:
|
when:
|
||||||
status: [ changed, failure ]
|
status: [ changed, failure ]
|
||||||
|
depends_on:
|
||||||
|
- Debian bullseye
|
||||||
|
- Debian buster
|
||||||
|
- Ubuntu focal
|
||||||
|
- Download CMake 3.12 installer
|
||||||
|
- Ubuntu bionic
|
||||||
|
|
|
@ -3,3 +3,5 @@
|
||||||
/examples/example99*
|
/examples/example99*
|
||||||
/translations/*.pot
|
/translations/*.pot
|
||||||
/translations/de
|
/translations/de
|
||||||
|
/CMakeUserPresets.json
|
||||||
|
/launch.json
|
||||||
|
|
|
@ -1,11 +1,11 @@
|
||||||
cmake_minimum_required(VERSION 3.12...3.18)
|
cmake_minimum_required(VERSION 3.12...3.20)
|
||||||
|
|
||||||
# Global build options.
|
# Global build options.
|
||||||
set(CMAKE_BUILD_TYPE "Release" CACHE STRING "The type of build.")
|
set(CMAKE_BUILD_TYPE "Release" CACHE STRING "The type of build.")
|
||||||
set(XGETTEXT_CMD "xgettext" CACHE STRING "The command for xgettext.")
|
set(XGETTEXT_CMD "xgettext" CACHE STRING "The command for xgettext.")
|
||||||
|
|
||||||
project(epubgrep
|
project(epubgrep
|
||||||
VERSION 0.5.0
|
VERSION 0.6.2
|
||||||
DESCRIPTION "Search tool for EPUB e-books"
|
DESCRIPTION "Search tool for EPUB e-books"
|
||||||
HOMEPAGE_URL "https://schlomp.space/tastytea/epubgrep"
|
HOMEPAGE_URL "https://schlomp.space/tastytea/epubgrep"
|
||||||
LANGUAGES CXX)
|
LANGUAGES CXX)
|
||||||
|
@ -15,6 +15,7 @@ list(APPEND CMAKE_MODULE_PATH "${PROJECT_SOURCE_DIR}/cmake")
|
||||||
# Project build options.
|
# Project build options.
|
||||||
option(WITH_TESTS "Compile tests." NO)
|
option(WITH_TESTS "Compile tests." NO)
|
||||||
option(FALLBACK_BUNDLED "Fall back to bundled libs." YES)
|
option(FALLBACK_BUNDLED "Fall back to bundled libs." YES)
|
||||||
|
option(WITH_SANITIZERS "Use sanitizers in debug builds." NO)
|
||||||
|
|
||||||
set(CMAKE_CXX_STANDARD 17)
|
set(CMAKE_CXX_STANDARD 17)
|
||||||
set(CMAKE_CXX_STANDARD_REQUIRED ON)
|
set(CMAKE_CXX_STANDARD_REQUIRED ON)
|
||||||
|
@ -46,6 +47,7 @@ find_package(nlohmann_json REQUIRED CONFIG)
|
||||||
add_subdirectory(src)
|
add_subdirectory(src)
|
||||||
|
|
||||||
if(WITH_TESTS)
|
if(WITH_TESTS)
|
||||||
|
include(CTest)
|
||||||
add_subdirectory(tests)
|
add_subdirectory(tests)
|
||||||
endif()
|
endif()
|
||||||
|
|
||||||
|
|
|
@ -0,0 +1,62 @@
|
||||||
|
{
|
||||||
|
"version": 2,
|
||||||
|
"cmakeMinimumRequired": {
|
||||||
|
"major": 3,
|
||||||
|
"minor": 20,
|
||||||
|
"patch": 0
|
||||||
|
},
|
||||||
|
"configurePresets": [
|
||||||
|
{
|
||||||
|
"name": "common",
|
||||||
|
"hidden": true,
|
||||||
|
"generator": "Unix Makefiles",
|
||||||
|
"binaryDir": "build",
|
||||||
|
"cacheVariables": {
|
||||||
|
"CMAKE_EXPORT_COMPILE_COMMANDS": true
|
||||||
|
}
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"name": "dev",
|
||||||
|
"displayName": "Developer config",
|
||||||
|
"description": "Build with debug symbols and tests enabled",
|
||||||
|
"inherits": "common",
|
||||||
|
"cacheVariables": {
|
||||||
|
"CMAKE_BUILD_TYPE": "Debug",
|
||||||
|
"WITH_TESTS": true,
|
||||||
|
"WITH_SANITIZERS": false
|
||||||
|
}
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"name": "dev_san",
|
||||||
|
"displayName": "Developer config, with sanitizers",
|
||||||
|
"description": "Build with debug symbols, tests enabled and sanitizers enabled",
|
||||||
|
"inherits": "dev",
|
||||||
|
"cacheVariables": {
|
||||||
|
"WITH_SANITIZERS": true
|
||||||
|
}
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"name": "release",
|
||||||
|
"displayName": "Release config",
|
||||||
|
"description": "Build without debug symbols or tests",
|
||||||
|
"inherits": "common",
|
||||||
|
"cacheVariables": {
|
||||||
|
"CMAKE_BUILD_TYPE": "Release",
|
||||||
|
"WITH_TESTS": false
|
||||||
|
}
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"testPresets": [
|
||||||
|
{
|
||||||
|
"name": "default",
|
||||||
|
"configurePreset": "dev",
|
||||||
|
"output": {
|
||||||
|
"outputOnFailure": true
|
||||||
|
},
|
||||||
|
"execution": {
|
||||||
|
"noTestsAction": "error",
|
||||||
|
"stopOnFailure": true
|
||||||
|
}
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
|
@ -63,9 +63,8 @@ directory. Then do the following:
|
||||||
|
|
||||||
[source,shell]
|
[source,shell]
|
||||||
--------------------------------------------------------------------------------
|
--------------------------------------------------------------------------------
|
||||||
cd build
|
cmake --build build
|
||||||
cmake --build .
|
cd translations
|
||||||
cd ../translations
|
|
||||||
msgmerge --update es.po epubgrep.pot
|
msgmerge --update es.po epubgrep.pot
|
||||||
--------------------------------------------------------------------------------
|
--------------------------------------------------------------------------------
|
||||||
|
|
||||||
|
|
64
README.adoc
64
README.adoc
|
@ -64,8 +64,8 @@ sudo apt install epubgrep
|
||||||
--------------------------------------------------------------------------------
|
--------------------------------------------------------------------------------
|
||||||
|
|
||||||
Replace _[code name]_ with the code name of your installation. Packages are
|
Replace _[code name]_ with the code name of your installation. Packages are
|
||||||
available for *buster* (Debian 10), *focal* (Ubuntu 20.04) and *bionic* (Ubuntu
|
available for *bullseye* (Debian 11), *buster* (Debian 10), *focal* (Ubuntu
|
||||||
18.04).
|
20.04) and *bionic* (Ubuntu 18.04).
|
||||||
|
|
||||||
[TIP]
|
[TIP]
|
||||||
If you get the error message that `add-apt-repository` was not found, install
|
If you get the error message that `add-apt-repository` was not found, install
|
||||||
|
@ -76,7 +76,7 @@ If you get the error message that `add-apt-repository` was not found, install
|
||||||
==== Dependencies
|
==== Dependencies
|
||||||
|
|
||||||
* Tested OS: Linux
|
* Tested OS: Linux
|
||||||
* C\++ compiler with C++17 support (tested: link:{uri-gcc}[GCC] 8/10,
|
* C\++ compiler with C++17 support (tested: link:{uri-gcc}[GCC] 8/9/10,
|
||||||
link:{uri-clang}[clang] 6/11)
|
link:{uri-clang}[clang] 6/11)
|
||||||
* link:{uri-cmake}[CMake] (at least: 3.12)
|
* link:{uri-cmake}[CMake] (at least: 3.12)
|
||||||
* link:{uri-boost}[Boost] (tested: 1.75.0 / 1.65.0)
|
* link:{uri-boost}[Boost] (tested: 1.75.0 / 1.65.0)
|
||||||
|
@ -94,8 +94,7 @@ If you get the error message that `add-apt-repository` was not found, install
|
||||||
===== Install dependencies in Debian or Ubuntu
|
===== Install dependencies in Debian or Ubuntu
|
||||||
|
|
||||||
Or distributions that are derived from Debian or Ubuntu. You will need at least
|
Or distributions that are derived from Debian or Ubuntu. You will need at least
|
||||||
Debian buster (10) or Ubuntu focal (20.04), unless you install a newer version
|
Debian buster (10) or Ubuntu focal (20.04).
|
||||||
of CMake.
|
|
||||||
|
|
||||||
[source,shell]
|
[source,shell]
|
||||||
--------------------------------------------------------------------------------
|
--------------------------------------------------------------------------------
|
||||||
|
@ -105,8 +104,21 @@ sudo apt install build-essential cmake libboost-program-options-dev \
|
||||||
nlohmann-json-dev
|
nlohmann-json-dev
|
||||||
--------------------------------------------------------------------------------
|
--------------------------------------------------------------------------------
|
||||||
|
|
||||||
[NOTE]
|
[TIP]
|
||||||
If `nlohmann-json-dev` can not be found, try nlohmann-json3-dev.
|
If `nlohmann-json-dev` cannot be found, try `nlohmann-json3-dev`.
|
||||||
|
|
||||||
|
===== Install dependencies in openSUSE
|
||||||
|
|
||||||
|
Tested on openSUSE Leap 15.3.
|
||||||
|
|
||||||
|
[source,shell]
|
||||||
|
--------------------------------------------------------------------------------
|
||||||
|
sudo zypper install cmake gcc10-c++ rpm-build \
|
||||||
|
libboost_program_options1_75_0-devel \
|
||||||
|
libboost_locale1_75_0-devel libboost_log1_75_0-devel \
|
||||||
|
fmt-devel libarchive-devel pugixml-devel \
|
||||||
|
nlohmann_json-devel asciidoc
|
||||||
|
--------------------------------------------------------------------------------
|
||||||
|
|
||||||
==== Get sourcecode
|
==== Get sourcecode
|
||||||
|
|
||||||
|
@ -132,18 +144,50 @@ cmake -S . -B build
|
||||||
cmake --build build --parallel $(nproc --ignore=1)
|
cmake --build build --parallel $(nproc --ignore=1)
|
||||||
--------------------------------------------------------------------------------
|
--------------------------------------------------------------------------------
|
||||||
|
|
||||||
To install, run `sudo cmake --install build`. To run the tests, run `cd
|
To install, run `sudo cmake --install build`. To run the tests, run `ctest
|
||||||
build/tests && ctest`.
|
--test-dir build`.
|
||||||
|
|
||||||
[TIP]
|
[TIP]
|
||||||
If you are using Debian or Ubuntu, or a distribution that is derived from these,
|
If you are using Debian or Ubuntu, or a distribution that is derived from these,
|
||||||
you can run `cpack -G DEB` in the build directory to generate a .deb-file. You
|
you can run `cpack -G DEB` in the build directory to generate a .deb-file. You
|
||||||
can then install it with `apt install ./epubgrep-*.deb`.
|
can then install it with `+++apt install ./epubgrep_*.deb+++`.
|
||||||
|
If you are using a distribution that uses RPM packages, like openSUSE or Fedora,
|
||||||
|
you can generate a package with `cpack -G RPM` and install it with `+++zypper
|
||||||
|
install ./epubgrep-*.rpm+++` or `+++dnf install ./epubgrep-*.rpm+++`.
|
||||||
|
|
||||||
.CMake options:
|
.CMake options:
|
||||||
* `-DCMAKE_BUILD_TYPE=Debug` for a debug build.
|
* `-DCMAKE_BUILD_TYPE=Debug` for a debug build.
|
||||||
* `-DWITH_TESTS=YES` if you want to compile the tests.
|
* `-DWITH_TESTS=YES` if you want to compile the tests.
|
||||||
* `-DXGETTEXT_CMD=String` The program to use instead of `xgettext`.
|
* `-DXGETTEXT_CMD=String` The program to use instead of `xgettext`.
|
||||||
* `-DFALLBACK_BUNDLED=NO` if you don't want to fall back on bundled libraries.
|
* `-DFALLBACK_BUNDLED=NO` if you don't want to fall back on bundled libraries.
|
||||||
|
* `-DWITH_SANITIZERS=YES` to use sanitizers in debug builds.
|
||||||
|
|
||||||
|
== Similar projects
|
||||||
|
|
||||||
|
* link:https://github.com/phiresky/ripgrep-all[ripgrep-all] can search EPUB
|
||||||
|
files and strips HTML, but does not display page numbers or headings.
|
||||||
|
* zipgrep from link:http://infozip.sourceforge.net/[unzip] can search EPUB files
|
||||||
|
but does not strip HTML and does not display page numbers or headings.
|
||||||
|
|
||||||
|
== Performance
|
||||||
|
|
||||||
|
A test with a directory containing 3333 EPUBs and 6269 files in total showed
|
||||||
|
this difference between epubgrep-0.6.2 and ripgrep-all-0.9.6:
|
||||||
|
|
||||||
|
[source,shellsession]
|
||||||
|
--------------------------------------------------------------------------------
|
||||||
|
% hyperfine "epubgrep 'floor' ~/Books" "rga 'floor' ~/Books"
|
||||||
|
Benchmark #1: epubgrep 'floor' ~/Books
|
||||||
|
Time (mean ± σ): 167.246 s ± 3.848 s [User: 176.251 s, System: 79.107 s]
|
||||||
|
Range (min … max): 161.533 s … 173.647 s 10 runs
|
||||||
|
|
||||||
|
Benchmark #2: rga 'floor' ~/Books
|
||||||
|
Time (mean ± σ): 9.219 s ± 0.506 s [User: 17.540 s, System: 12.773 s]
|
||||||
|
Range (min … max): 8.571 s … 9.923 s 10 runs
|
||||||
|
|
||||||
|
Summary
|
||||||
|
'rga 'floor' ~/Books' ran
|
||||||
|
18.14 ± 1.08 times faster than 'epubgrep 'floor' ~/Books'
|
||||||
|
--------------------------------------------------------------------------------
|
||||||
|
|
||||||
include::{uri-base}/raw/branch/main/CONTRIBUTING.adoc[]
|
include::{uri-base}/raw/branch/main/CONTRIBUTING.adoc[]
|
||||||
|
|
|
@ -24,9 +24,13 @@ if(CMAKE_CXX_COMPILER_ID MATCHES "GNU" OR CMAKE_CXX_COMPILER_ID MATCHES "Clang"
|
||||||
"-Wdouble-promotion"
|
"-Wdouble-promotion"
|
||||||
"-Wformat=2"
|
"-Wformat=2"
|
||||||
"-ftrapv"
|
"-ftrapv"
|
||||||
"-fsanitize=undefined"
|
|
||||||
"-Og"
|
"-Og"
|
||||||
"-fno-omit-frame-pointer")
|
"-fno-omit-frame-pointer")
|
||||||
|
if(WITH_SANITIZERS)
|
||||||
|
list(APPEND tmp_CXXFLAGS
|
||||||
|
"-fsanitize=undefined"
|
||||||
|
"-fsanitize=address")
|
||||||
|
endif()
|
||||||
if(CMAKE_CXX_COMPILER_ID MATCHES "GNU")
|
if(CMAKE_CXX_COMPILER_ID MATCHES "GNU")
|
||||||
list(APPEND tmp_CXXFLAGS
|
list(APPEND tmp_CXXFLAGS
|
||||||
"-Wlogical-op"
|
"-Wlogical-op"
|
||||||
|
@ -44,8 +48,11 @@ if(CMAKE_CXX_COMPILER_ID MATCHES "GNU" OR CMAKE_CXX_COMPILER_ID MATCHES "Clang"
|
||||||
endif()
|
endif()
|
||||||
add_compile_options("$<$<CONFIG:Debug>:${tmp_CXXFLAGS}>")
|
add_compile_options("$<$<CONFIG:Debug>:${tmp_CXXFLAGS}>")
|
||||||
|
|
||||||
list(APPEND tmp_LDFLAGS
|
if(WITH_SANITIZERS)
|
||||||
"-fsanitize=undefined")
|
list(APPEND tmp_LDFLAGS
|
||||||
|
"-fsanitize=undefined"
|
||||||
|
"-fsanitize=address")
|
||||||
|
endif()
|
||||||
# add_link_options was introduced in version 3.13.
|
# add_link_options was introduced in version 3.13.
|
||||||
if(${CMAKE_VERSION} VERSION_LESS 3.13)
|
if(${CMAKE_VERSION} VERSION_LESS 3.13)
|
||||||
set(CMAKE_SHARED_LINKER_FLAGS_DEBUG "${tmp_LDFLAGS}")
|
set(CMAKE_SHARED_LINKER_FLAGS_DEBUG "${tmp_LDFLAGS}")
|
||||||
|
|
|
@ -6,7 +6,9 @@ set(CPACK_PACKAGE_CONTACT "tastytea <tastytea@tastytea.de>")
|
||||||
# Should be set automatically, but they are not.
|
# Should be set automatically, but they are not.
|
||||||
set(CPACK_PACKAGE_NAME "${PROJECT_NAME}")
|
set(CPACK_PACKAGE_NAME "${PROJECT_NAME}")
|
||||||
set(CPACK_PACKAGE_VERSION "${PROJECT_VERSION}")
|
set(CPACK_PACKAGE_VERSION "${PROJECT_VERSION}")
|
||||||
|
set(CPACK_PACKAGE_DESCRIPTION_SUMMARY "${CMAKE_PROJECT_DESCRIPTION}")
|
||||||
|
|
||||||
|
# DEB
|
||||||
# Figure out dependencies automatically.
|
# Figure out dependencies automatically.
|
||||||
set(CPACK_DEBIAN_PACKAGE_SHLIBDEPS ON)
|
set(CPACK_DEBIAN_PACKAGE_SHLIBDEPS ON)
|
||||||
|
|
||||||
|
@ -26,4 +28,30 @@ endif()
|
||||||
set(CPACK_DEBIAN_FILE_NAME
|
set(CPACK_DEBIAN_FILE_NAME
|
||||||
"${CPACK_PACKAGE_NAME}_${CPACK_PACKAGE_VERSION}-0_${CPACK_DEBIAN_PACKAGE_ARCHITECTURE}_${DEBIAN_CODENAME}.deb")
|
"${CPACK_PACKAGE_NAME}_${CPACK_PACKAGE_VERSION}-0_${CPACK_DEBIAN_PACKAGE_ARCHITECTURE}_${DEBIAN_CODENAME}.deb")
|
||||||
|
|
||||||
|
# RPM
|
||||||
|
set(CPACK_RPM_PACKAGE_LICENSE "AGPL-3")
|
||||||
|
|
||||||
|
# Figure out dependencies automatically.
|
||||||
|
set(CPACK_RPM_PACKAGE_AUTOREQ ON)
|
||||||
|
|
||||||
|
# Should be set automatically, but it is not.
|
||||||
|
execute_process(COMMAND uname -m
|
||||||
|
OUTPUT_VARIABLE CPACK_RPM_PACKAGE_ARCHITECTURE
|
||||||
|
OUTPUT_STRIP_TRAILING_WHITESPACE)
|
||||||
|
|
||||||
|
set(CPACK_PACKAGE_FILE_NAME
|
||||||
|
"${CPACK_PACKAGE_NAME}-${CPACK_PACKAGE_VERSION}-0.${CPACK_RPM_PACKAGE_ARCHITECTURE}")
|
||||||
|
|
||||||
|
execute_process(COMMAND lsb_release --id --short
|
||||||
|
OUTPUT_VARIABLE OS
|
||||||
|
OUTPUT_STRIP_TRAILING_WHITESPACE)
|
||||||
|
|
||||||
|
if("${OS}" STREQUAL "openSUSE")
|
||||||
|
execute_process(COMMAND lsb_release --release --short
|
||||||
|
OUTPUT_VARIABLE OS_RELEASE
|
||||||
|
OUTPUT_STRIP_TRAILING_WHITESPACE)
|
||||||
|
set(CPACK_PACKAGE_FILE_NAME
|
||||||
|
"${CPACK_PACKAGE_NAME}-${CPACK_PACKAGE_VERSION}-0.${CPACK_RPM_PACKAGE_ARCHITECTURE}.opensuse-${OS_RELEASE}")
|
||||||
|
endif()
|
||||||
|
|
||||||
include(CPack)
|
include(CPack)
|
||||||
|
|
|
@ -2,7 +2,7 @@
|
||||||
:doctype: manpage
|
:doctype: manpage
|
||||||
:Author: tastytea
|
:Author: tastytea
|
||||||
:Email: tastytea@tastytea.de
|
:Email: tastytea@tastytea.de
|
||||||
:Date: 2021-06-01
|
:Date: 2021-07-02
|
||||||
:Revision: 0.0.0
|
:Revision: 0.0.0
|
||||||
:man source: epubgrep
|
:man source: epubgrep
|
||||||
:man manual: General Commands Manual
|
:man manual: General Commands Manual
|
||||||
|
@ -13,7 +13,7 @@ epubgrep - Search tool for EPUB e-books.
|
||||||
|
|
||||||
== SYNOPSIS
|
== SYNOPSIS
|
||||||
|
|
||||||
*epubgrep* [_OPTION_]… _PATTERN_ [_FILE_]…
|
*epubgrep* [_OPTION_]… _PATTERN_ _FILE_…
|
||||||
|
|
||||||
== DESCRIPTION
|
== DESCRIPTION
|
||||||
|
|
||||||
|
@ -21,14 +21,44 @@ epubgrep - Search tool for EPUB e-books.
|
||||||
for command line switches where possible. However, not all grep switches are
|
for command line switches where possible. However, not all grep switches are
|
||||||
implemented and some additional switches are added.
|
implemented and some additional switches are added.
|
||||||
|
|
||||||
|
This manual is also available at
|
||||||
|
<https://man.schlomp.space/tastytea/?program=epubgrep>.
|
||||||
|
|
||||||
|
== EXAMPLES
|
||||||
|
|
||||||
|
.Search for Apple(s) or Orange(s) with 2 words of context around the matches, case insensitively
|
||||||
|
[source,shell]
|
||||||
|
--------------------------------------------------------------------------------
|
||||||
|
epubgrep -PiC2 '(Apple|Orange)s?' file.epub
|
||||||
|
--------------------------------------------------------------------------------
|
||||||
|
|
||||||
|
.Extract external hyperlinks
|
||||||
|
[source,shell]
|
||||||
|
--------------------------------------------------------------------------------
|
||||||
|
epubgrep -PC0 --raw --no-filename=all '"http[^"]+"' file.epub | tr -d '"'
|
||||||
|
--------------------------------------------------------------------------------
|
||||||
|
|
||||||
|
.Save the search results to an HTML file and output a status message every 20 seconds
|
||||||
|
[source,shell]
|
||||||
|
--------------------------------------------------------------------------------
|
||||||
|
epubgrep -C2 --status --status-interval=20 --html 'Apples' file.epub > result.html
|
||||||
|
--------------------------------------------------------------------------------
|
||||||
|
|
||||||
== OPTIONS
|
== OPTIONS
|
||||||
|
|
||||||
|
=== General options
|
||||||
|
|
||||||
*-h*, *--help*::
|
*-h*, *--help*::
|
||||||
Display a short help message and exit.
|
Display a short help message and exit.
|
||||||
|
|
||||||
*-V*, *--version*::
|
*-V*, *--version*::
|
||||||
Show version, copyright and license.
|
Show version, copyright and license.
|
||||||
|
|
||||||
|
*--debug*::
|
||||||
|
Write debug output to the terminal and log file.
|
||||||
|
|
||||||
|
=== Search options
|
||||||
|
|
||||||
*-G*, *--basic-regexp*::
|
*-G*, *--basic-regexp*::
|
||||||
_PATTERN_ is a POSIX basic regular expression. This is the default.
|
_PATTERN_ is a POSIX basic regular expression. This is the default.
|
||||||
|
|
||||||
|
@ -46,25 +76,10 @@ _PATTERN_ is a Perl regular expression.
|
||||||
*-i*, *--ignore-case*::
|
*-i*, *--ignore-case*::
|
||||||
Ignore case distinctions in pattern and data.
|
Ignore case distinctions in pattern and data.
|
||||||
|
|
||||||
*-e* _PATTERN_, *--regexp* _PATTERN_::
|
|
||||||
Use additional _PATTERN_ for matching. Can be used more than once.
|
|
||||||
|
|
||||||
*-a*, *--raw*::
|
*-a*, *--raw*::
|
||||||
Do not clean up text before searching. No HTML stripping, no newline removal,
|
Do not clean up text before searching. No HTML stripping, no newline removal,
|
||||||
all files will be read (not just the text documents listed in the spine).
|
all files will be read (not just the text documents listed in the spine).
|
||||||
|
|
||||||
*-C* _NUMBER_, *--context* _NUMBER_::
|
|
||||||
Print _NUMBER_ words of context around matches.
|
|
||||||
|
|
||||||
*--nocolor*::
|
|
||||||
Turn off colors and other decorations.
|
|
||||||
|
|
||||||
*--no-filename* _WHICH_::
|
|
||||||
|
|
||||||
Suppress the mentioning of file names on output. _WHICH_ is ‘filesystem’ for the
|
|
||||||
file names on your file systems, ‘in-epub’ for the file names inside the EPUB or
|
|
||||||
‘all’. Chapters and page numbers will still be output.
|
|
||||||
|
|
||||||
*-r*, *--recursive*::
|
*-r*, *--recursive*::
|
||||||
Read all files under each directory, recursively, following symbolic links only
|
Read all files under each directory, recursively, following symbolic links only
|
||||||
if they are on the command line. Silently skips directories that are not
|
if they are on the command line. Silently skips directories that are not
|
||||||
|
@ -74,20 +89,44 @@ readable by the user.
|
||||||
Read all files under each directory, recursively. Follow all symbolic
|
Read all files under each directory, recursively. Follow all symbolic
|
||||||
links. Silently skips directories that are not readable by the user.
|
links. Silently skips directories that are not readable by the user.
|
||||||
|
|
||||||
|
*-e* _PATTERN_, *--regexp* _PATTERN_::
|
||||||
|
Use additional _PATTERN_ for matching. Can be used more than once.
|
||||||
|
|
||||||
|
=== Output options
|
||||||
|
|
||||||
|
*-C* _NUMBER_, *--context* _NUMBER_::
|
||||||
|
Print _NUMBER_ words of context around matches.
|
||||||
|
|
||||||
|
*--nocolor*::
|
||||||
|
Turn off colors and other decorations.
|
||||||
|
|
||||||
|
*--no-filename* _WHICH_::
|
||||||
|
Suppress the mentioning of file names on output. _WHICH_ is ‘filesystem’ for the
|
||||||
|
file names on your file systems, ‘in-epub’ for the file names inside the EPUB or
|
||||||
|
‘all’. Chapters and page numbers will still be output.
|
||||||
|
|
||||||
*--ignore-archive-errors*::
|
*--ignore-archive-errors*::
|
||||||
Ignore errors about wrong file formats. When you search directories recursively,
|
Ignore errors about wrong file formats. When you search directories recursively,
|
||||||
it is likely that there are files which are not EPUB files. This setting
|
it is likely that there are files which are not EPUB files. This setting
|
||||||
suppresses errors related to them.
|
suppresses errors related to them.
|
||||||
|
|
||||||
*--debug*::
|
|
||||||
Write debug output to the terminal and log file.
|
|
||||||
|
|
||||||
*--json*::
|
*--json*::
|
||||||
Output JSON instead of plain text. JSON will only be output at the end of the
|
Output JSON instead of plain text. JSON will only be output at the end of the
|
||||||
program. There will be an object named `generator` with the property
|
program. There will be an object named `generator` with the property
|
||||||
`epubgrep`. The value is the version of the program, as string. The matches are
|
`epubgrep`. The value is the version of the program, as string. The matches are
|
||||||
in an array named `matches`. I will try not to break the API. 😊
|
in an array named `matches`. I will try not to break the API. 😊
|
||||||
|
|
||||||
|
*--html*::
|
||||||
|
Output HTML instead of plain text. HTML will only be output at the end of the
|
||||||
|
program.
|
||||||
|
|
||||||
|
*--status*::
|
||||||
|
Output a status message to standard error every *--status-interval* seconds. The
|
||||||
|
default interval is 30 seconds.
|
||||||
|
|
||||||
|
*--status-interval* _NUMBER_::
|
||||||
|
Set status message interval to _NUMBER_ seconds.
|
||||||
|
|
||||||
== USAGE
|
== USAGE
|
||||||
|
|
||||||
[source,shellsession]
|
[source,shellsession]
|
||||||
|
@ -119,15 +158,16 @@ occur more than once are merged.
|
||||||
|
|
||||||
==== Example configuration file
|
==== Example configuration file
|
||||||
|
|
||||||
This example makes epubgrep ignore files which are not EPUB, suppress the file
|
This example makes epubgrep always search directories recursively, ignore files
|
||||||
names on output, print 2 words of context around matches (unless overridden on
|
which are not EPUB, not print the file names inside the EPUB, print 2 words of
|
||||||
the command line) and search for mentions of the words thyme and oregano in
|
context around matches (unless overridden on the command line) and search for
|
||||||
every book.
|
mentions of the words thyme and oregano in every book.
|
||||||
|
|
||||||
[source,cfg]
|
[source,cfg]
|
||||||
--------------------------------------------------------------------------------
|
--------------------------------------------------------------------------------
|
||||||
|
recursive = 1
|
||||||
ignore-archive-errors = 1
|
ignore-archive-errors = 1
|
||||||
no-filename = 1
|
no-filename = in-epub
|
||||||
context = 2
|
context = 2
|
||||||
regexp = [Tt]hyme
|
regexp = [Tt]hyme
|
||||||
regexp = [Oo]regano
|
regexp = [Oo]regano
|
||||||
|
|
BIN
screenshot.png
BIN
screenshot.png
Binary file not shown.
Before Width: | Height: | Size: 116 KiB After Width: | Height: | Size: 130 KiB |
|
@ -0,0 +1,306 @@
|
||||||
|
/* This file is part of epubgrep.
|
||||||
|
* Copyright © 2021 tastytea <tastytea@tastytea.de>
|
||||||
|
*
|
||||||
|
* This program is free software: you can redistribute it and/or modify
|
||||||
|
* it under the terms of the GNU Affero General Public License as published by
|
||||||
|
* the Free Software Foundation, version 3.
|
||||||
|
*
|
||||||
|
* This program is distributed in the hope that it will be useful,
|
||||||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
* GNU Affero General Public License for more details.
|
||||||
|
*
|
||||||
|
* You should have received a copy of the GNU Affero General Public License
|
||||||
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
*/
|
||||||
|
|
||||||
|
#include "book.hpp"
|
||||||
|
|
||||||
|
#include "fs-compat.hpp"
|
||||||
|
#include "helpers.hpp"
|
||||||
|
#include "log.hpp"
|
||||||
|
#include "zip.hpp"
|
||||||
|
|
||||||
|
#include <boost/locale/message.hpp>
|
||||||
|
#include <boost/regex.hpp>
|
||||||
|
#include <fmt/format.h>
|
||||||
|
#include <fmt/ostream.h> // For compatibility with fmt 4.
|
||||||
|
#include <pugixml.hpp>
|
||||||
|
|
||||||
|
#include <algorithm>
|
||||||
|
#include <memory>
|
||||||
|
#include <string>
|
||||||
|
#include <string_view>
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
namespace epubgrep::book
|
||||||
|
{
|
||||||
|
|
||||||
|
using boost::locale::translate;
|
||||||
|
using fmt::format;
|
||||||
|
using std::string;
|
||||||
|
|
||||||
|
// Read the EPUB at filepath and return its documents together with the book
// language. With raw == false only the documents listed in the spine are read
// and each one is entity-decoded and cleaned by process_page(); with
// raw == true every file in the archive is kept unmodified.
book read(const fs::path filepath, const bool raw)
{
    using helpers::unescape_html;

    DEBUGLOG << "Processing book " << filepath;

    // Raw mode looks at every archive member, normal mode only at the spine.
    std::vector<string> epub_filepaths{raw ? zip::list(filepath)
                                           : list_spine(filepath)};

    // Reads <dc:language> from the OPF metadata. Yields an empty string if
    // the OPF cannot be read or parsed.
    const auto detect_language{
        [&filepath]() -> string
        {
            try
            {
                pugi::xml_document xml;
                auto opf_file_path{get_opf_file_path(filepath)};
                const std::string opf_file{
                    zip::read_file(filepath, opf_file_path.string())};

                const auto result{
                    xml.load_buffer(&opf_file[0], opf_file.size())};
                if (result)
                {
                    // Element names may or may not carry the opf: prefix.
                    auto lang{xml.child("package")
                                  .child("metadata")
                                  .child("dc:language")};
                    if (lang == nullptr)
                    {
                        lang = xml.child("opf:package")
                                   .child("opf:metadata")
                                   .child("dc:language");
                    }
                    return lang.text().as_string();
                }
            }
            catch (epubgrep::zip::exception &e)
            {
                if (e.code != 1) // 1 == container.xml not found.
                {
                    LOG(log::sev::error) << e.what();
                }
            }
            return "";
        }};

    book current_book;
    current_book.language = detect_language();
    DEBUGLOG << "Book language detected: " << current_book.language;

    for (const auto &entry : epub_filepaths)
    {
        DEBUGLOG << "Processing document " << entry;
        document doc;
        if (raw)
        {
            doc.text_raw = zip::read_file(filepath, entry);
            doc.text = std::make_unique<std::string>(doc.text_raw);
        }
        else
        {
            doc = process_page(unescape_html(zip::read_file(filepath, entry)));
        }
        doc.language = current_book.language; // FIXME: Get language of doc.
        current_book.files.emplace_back(entry, std::move(doc));
    }

    return current_book;
}
|
||||||
|
|
||||||
|
// Turn an HTML page into plain text. Line breaks and tabs become spaces,
// carriage returns are dropped, runs of spaces are collapsed and every tag is
// removed. While removing tags, the text of <h1>…<h6> elements is recorded in
// document::headlines and the title/aria-label of "pagebreak" <span>s in
// document::pages, each keyed by its position in the cleaned text.
document process_page(const std::string_view text)
{
    string output{text};
    static const boost::regex re_header_start{"<[hH][1-6]"};
    static const boost::regex re_header_end{"</[hH][1-6]"};
    static const boost::regex re_pagebreak{"[^>]+pagebreak[^>]+"
                                           "(title|aria-label)"
                                           "=\"([[:alnum:]]+)\""};

    // Index one past the next '>' at or after `from`. If there is none (an
    // unterminated tag) the end of the text is returned, so that callers never
    // see the wrapped-around value of npos + 1.
    const auto tag_end{[&output](const size_t from) -> size_t
                       {
                           const auto close{output.find('>', from)};
                           return close == string::npos ? output.size()
                                                        : close + 1;
                       }};

    {
        size_t pos{0};
        while ((pos = output.find_first_of("\n\t\r", pos)) != string::npos)
        {
            if (output[pos] == '\r')
            {
                output.erase(pos, 1);
            }
            else
            {
                output.replace(pos, 1, " ");
            }
        }
    }
    {
        // Collapse runs of spaces. pos is not advanced after a replacement, so
        // a run of any length shrinks to a single space.
        size_t pos{0};
        while ((pos = output.find("  ", pos)) != string::npos)
        {
            output.replace(pos, 2, " ");
        }
    }

    size_t pos{0};
    document doc;
    size_t headline_start{string::npos};
    while ((pos = output.find('<', pos)) != string::npos)
    {
        auto endpos{tag_end(pos)};

        if (boost::regex_match(output.substr(pos, 3), re_header_start))
        {
            // The opening tag is erased below, so this index then refers to
            // the first character of the headline text.
            headline_start = pos;
        }
        else if (boost::regex_match(output.substr(pos, 4), re_header_end))
        {
            if (headline_start != string::npos)
            {
                // Tags nested in the headline have already been erased, so
                // the range up to the closing tag is plain text.
                doc.headlines.insert(
                    {headline_start,
                     output.substr(headline_start, pos - headline_start)});
                headline_start = string::npos;
            }
        }
        else if (output.substr(pos, 6) == "<span ")
        {
            boost::match_results<string::const_iterator> match;
            using it_size_t = string::const_iterator::difference_type;
            string::const_iterator begin{output.begin()
                                         + static_cast<it_size_t>(pos)};
            string::const_iterator end{output.begin()
                                       + static_cast<it_size_t>(endpos)};

            // Only the tag itself is searched; match[2] is the page label.
            if (boost::regex_search(begin, end, match, re_pagebreak))
            {
                doc.pages.insert({pos, match[2].str()});
            }
        }
        else if (output.substr(pos, 7) == "<style "
                 || output.substr(pos, 8) == "<script ")
        {
            // Not self-closing: also drop the element content by extending the
            // range through the next '>'.
            // NOTE(review): this assumes the content contains no '>' before
            // the closing tag — confirm whether that is acceptable.
            if (output.find("/>", pos) > endpos)
            {
                endpos = tag_end(endpos);
            }
        }

        output.erase(pos, endpos - pos);
    }

    doc.text_cleaned = std::move(output);
    doc.text = std::make_unique<string>(doc.text_cleaned);

    return doc;
}
|
||||||
|
|
||||||
|
std::string headline(const document &doc, const size_t pos)
|
||||||
|
{
|
||||||
|
std::string_view last;
|
||||||
|
|
||||||
|
for (const auto &pair : doc.headlines)
|
||||||
|
{
|
||||||
|
if (pair.first > pos)
|
||||||
|
{
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
last = pair.second;
|
||||||
|
}
|
||||||
|
|
||||||
|
return string(last);
|
||||||
|
}
|
||||||
|
|
||||||
|
// Return the page label recorded at the greatest position that is not after
// pos, or an empty string if no page break lies at or before pos.
string page(const document &doc, const size_t pos)
{
    // First page break strictly after pos; its predecessor is the one we want.
    auto next{doc.pages.upper_bound(pos)};
    if (next == doc.pages.begin())
    {
        return {};
    }

    --next;
    return next->second;
}
|
||||||
|
|
||||||
|
// Look up the path of the OPF file inside the EPUB: the full-path attribute of
// the first child of <rootfiles> in META-INF/container.xml. If container.xml
// cannot be parsed, the parser's description is logged and an empty path is
// returned.
fs::path get_opf_file_path(const fs::path &zipfile)
{
    const std::string container{
        zip::read_file(zipfile, "META-INF/container.xml")};

    pugi::xml_document xml;
    const auto result{xml.load_buffer(container.data(), container.size())};
    if (!result)
    {
        LOG(log::sev::error) << result.description() << '\n';
        return fs::path{};
    }

    const auto rootfile{
        xml.child("container").child("rootfiles").first_child()};
    return fs::path{rootfile.attribute("full-path").value()};
}
|
||||||
|
|
||||||
|
// List the documents named in the spine of the EPUB at filepath, in spine
// order. Each spine <itemref> is resolved through the manifest to an href,
// which is URL-decoded and, unless it starts with '/', prefixed with the
// directory of the OPF file. Spine entries without a usable manifest href are
// logged and skipped. If the OPF cannot be located or parsed, or no document
// remains, an error is logged and an empty list is returned.
std::vector<string> list_spine(const fs::path &filepath)
{
    auto opf_file_path{get_opf_file_path(filepath)};
    std::vector<std::string> spine_filepaths;
    if (!opf_file_path.empty())
    {
        DEBUGLOG << "Parsing " << opf_file_path;
        pugi::xml_document xml;
        const std::string opf_file{
            zip::read_file(filepath, opf_file_path.string())};
        const auto result{xml.load_buffer(&opf_file[0], opf_file.size())};
        if (result)
        {
            // Element names may or may not carry the opf: prefix.
            auto manifest{xml.child("package").child("manifest")};
            if (manifest == nullptr)
            {
                manifest = xml.child("opf:package").child("opf:manifest");
            }
            auto spine{xml.child("package").child("spine")};
            if (spine == nullptr)
            {
                spine = xml.child("opf:package").child("opf:spine");
            }

            for (const auto &itemref : spine)
            {
                const auto &idref{itemref.attribute("idref").value()};
                const auto &item{manifest.find_child_by_attribute("id", idref)};
                auto href{helpers::urldecode(item.attribute("href").value())};
                if (href.empty())
                {
                    // Without this check the entry would turn into the bare
                    // OPF directory, which is not a document.
                    LOG(log::sev::error)
                        << "Spine item " << idref
                        << " has no file in the manifest. Skipping item.\n";
                    continue;
                }
                if (href[0] != '/')
                {
                    href = (opf_file_path.parent_path() / href);
                }
                DEBUGLOG << "Found in spine: " << href;
                spine_filepaths.emplace_back(href);
            }
        }
        else
        {
            LOG(log::sev::error) << "XML: " << result.description() << '\n';
        }
    }

    if (opf_file_path.empty() || spine_filepaths.empty())
    {
        LOG(log::sev::error)
            << format(translate("{0:s} is damaged. Could not read spine. "
                                "Skipping file.\n")
                          .str()
                          .c_str(),
                      filepath.c_str());
        return {};
    }

    return spine_filepaths;
}
|
||||||
|
|
||||||
|
} // namespace epubgrep::book
|
|
@ -0,0 +1,73 @@
|
||||||
|
/* This file is part of epubgrep.
|
||||||
|
* Copyright © 2021 tastytea <tastytea@tastytea.de>
|
||||||
|
*
|
||||||
|
* This program is free software: you can redistribute it and/or modify
|
||||||
|
* it under the terms of the GNU Affero General Public License as published by
|
||||||
|
* the Free Software Foundation, version 3.
|
||||||
|
*
|
||||||
|
* This program is distributed in the hope that it will be useful,
|
||||||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||||||
|
* GNU Affero General Public License for more details.
|
||||||
|
*
|
||||||
|
* You should have received a copy of the GNU Affero General Public License
|
||||||
|
* along with this program. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
*/
|
||||||
|
|
||||||
|
#ifndef EPUBGREP_BOOK_HPP
|
||||||
|
#define EPUBGREP_BOOK_HPP
|
||||||
|
|
||||||
|
#include "fs-compat.hpp"
|
||||||
|
|
||||||
|
#include <map>
|
||||||
|
#include <memory>
|
||||||
|
#include <string>
|
||||||
|
#include <string_view>
|
||||||
|
#include <utility>
|
||||||
|
#include <vector>
|
||||||
|
|
||||||
|
namespace epubgrep::book
|
||||||
|
{
|
||||||
|
|
||||||
|
using std::string;
|
||||||
|
|
||||||
|
//! One document (page) of an EPUB.
struct document
{
    //! The page as HTML.
    std::string text_raw;
    //! The page as plain text.
    std::string text_cleaned;
    //! The text version that should be used (raw or cleaned).
    std::unique_ptr<std::string> text;
    //! Headlines: position in the text → title.
    std::map<size_t, std::string> headlines;
    //! Page breaks: position in the text → page label.
    std::map<size_t, std::string> pages;
    //! Language of the page.
    std::string language;
} __attribute__((aligned(128)));
|
||||||
|
|
||||||
|
//! EPUB file.
|
||||||
|
struct book
|
||||||
|
{
|
||||||
|
std::vector<std::pair<string, document>> files; //!< filename, file
|
||||||
|
std::vector<std::pair<string, string>> toc; //!< title, href
|
||||||
|
string language; //!< Book language
|
||||||
|
} __attribute__((aligned(128)));
|
||||||
|
|
||||||
|
//! Read and process book.
|
||||||
|
[[nodiscard]] book read(fs::path filepath, bool raw);
|
||||||
|
|
||||||
|
//! Clean up page and record headlines and page numbers.
|
||||||
|
[[nodiscard]] document process_page(std::string_view text);
|
||||||
|
|
||||||
|
//! Return last headline if possible.
|
||||||
|
[[nodiscard]] string headline(const document &doc, size_t pos);
|
||||||
|
|
||||||
|
//! Return current page if possible.
|
||||||
|
[[nodiscard]] string page(const document &doc, size_t pos);
|
||||||
|
|
||||||
|
//! Returns the file path of the OPF file in the EPUB.
|
||||||
|
[[nodiscard]] fs::path get_opf_file_path(const fs::path &zipfile);
|
||||||
|
|
||||||
|
//! Returns the files in the EPUB “spine” (all pages that are actually text).
|
||||||
|
[[nodiscard]] std::vector<string> list_spine(const fs::path &filepath);
|
||||||
|
|
||||||
|
} // namespace epubgrep::book
|
||||||
|
|
||||||
|
#endif // EPUBGREP_BOOK_HPP
|
|
@ -43,7 +43,7 @@ std::string unescape_html(const std::string_view html)
|
||||||
|
|
||||||
// Source: https://en.wikipedia.org/wiki/List_of_XML_and_HTML_character_
|
// Source: https://en.wikipedia.org/wiki/List_of_XML_and_HTML_character_
|
||||||
// entity_references#Character_entity_references_in_HTML
|
// entity_references#Character_entity_references_in_HTML
|
||||||
const std::map<std::string_view, char32_t>
|
static const std::map<std::string_view, char32_t>
|
||||||
names{{"exclamation", 0x0021}, {"quot", 0x0022}, {"percent", 0x0025},
|
names{{"exclamation", 0x0021}, {"quot", 0x0022}, {"percent", 0x0025},
|
||||||
{"amp", 0x0026}, {"apos", 0x0027}, {"add", 0x002B},
|
{"amp", 0x0026}, {"apos", 0x0027}, {"add", 0x002B},
|
||||||
{"lt", 0x003C}, {"equal", 0x003D}, {"gt", 0x003E},
|
{"lt", 0x003C}, {"equal", 0x003D}, {"gt", 0x003E},
|
||||||
|
@ -150,7 +150,7 @@ std::string unescape_html(const std::string_view html)
|
||||||
try
|
try
|
||||||
{
|
{
|
||||||
const char32_t codepoint{
|
const char32_t codepoint{
|
||||||
[&match, &names]
|
[&match]
|
||||||
{
|
{
|
||||||
// If it doesn't start with a '#' it is a named entity.
|
// If it doesn't start with a '#' it is a named entity.
|
||||||
if (match[1].str()[0] != '#')
|
if (match[1].str()[0] != '#')
|
||||||
|
@ -184,7 +184,7 @@ std::string unescape_html(const std::string_view html)
|
||||||
|
|
||||||
std::string_view get_env(const std::string_view name)
|
std::string_view get_env(const std::string_view name)
|
||||||
{
|
{
|
||||||
const char *env = std::getenv(name.data());
|
const char *env = std::getenv(name.data()); // NOLINT(concurrency-mt-unsafe)
|
||||||
if (env != nullptr)
|
if (env != nullptr)
|
||||||
{
|
{
|
||||||
return env;
|
return env;
|
||||||
|
|
68
src/main.cpp
68
src/main.cpp
|
@ -28,6 +28,7 @@
|
||||||
#include <fmt/format.h>
|
#include <fmt/format.h>
|
||||||
#include <fmt/ostream.h> // For compatibility with fmt 4.
|
#include <fmt/ostream.h> // For compatibility with fmt 4.
|
||||||
|
|
||||||
|
#include <chrono>
|
||||||
#include <clocale>
|
#include <clocale>
|
||||||
#include <cmath>
|
#include <cmath>
|
||||||
#include <cstdint>
|
#include <cstdint>
|
||||||
|
@ -45,6 +46,9 @@
|
||||||
#include <thread>
|
#include <thread>
|
||||||
#include <vector>
|
#include <vector>
|
||||||
|
|
||||||
|
constexpr int EXIT_FATAL{2}; // NOLINT(readability-identifier-naming)
|
||||||
|
|
||||||
|
// NOLINTNEXTLINE(readability-function-cognitive-complexity)
|
||||||
int main(int argc, char *argv[])
|
int main(int argc, char *argv[])
|
||||||
{
|
{
|
||||||
using namespace epubgrep;
|
using namespace epubgrep;
|
||||||
|
@ -56,7 +60,7 @@ int main(int argc, char *argv[])
|
||||||
|
|
||||||
// locale_generator("").name.c_str() returns "*" instead of "". That's why
|
// locale_generator("").name.c_str() returns "*" instead of "". That's why
|
||||||
// the global C locale isn't changed. So we have to set it additionally.
|
// the global C locale isn't changed. So we have to set it additionally.
|
||||||
std::setlocale(LC_ALL, "");
|
std::setlocale(LC_ALL, ""); // NOLINT(concurrency-mt-unsafe)
|
||||||
boost::locale::generator locale_generator;
|
boost::locale::generator locale_generator;
|
||||||
locale_generator.add_messages_path("translations");
|
locale_generator.add_messages_path("translations");
|
||||||
locale_generator.add_messages_path("/usr/share/locale");
|
locale_generator.add_messages_path("/usr/share/locale");
|
||||||
|
@ -77,7 +81,7 @@ int main(int argc, char *argv[])
|
||||||
{ // Exceptions we can't recover from or ones we don't know.
|
{ // Exceptions we can't recover from or ones we don't know.
|
||||||
LOG(log::sev::fatal)
|
LOG(log::sev::fatal)
|
||||||
<< e.what() << translate(" (while parsing options)");
|
<< e.what() << translate(" (while parsing options)");
|
||||||
return EXIT_FAILURE;
|
return EXIT_FATAL;
|
||||||
}
|
}
|
||||||
|
|
||||||
if (opts.debug)
|
if (opts.debug)
|
||||||
|
@ -122,8 +126,10 @@ int main(int argc, char *argv[])
|
||||||
}
|
}
|
||||||
|
|
||||||
LOG(log::sev::error)
|
LOG(log::sev::error)
|
||||||
<< format(translate("Could not open {0:s}: {1:s}").str(),
|
<< format(translate("Could not open {0:s}: {1:s}")
|
||||||
e.path1(), e.what());
|
.str()
|
||||||
|
.c_str(),
|
||||||
|
e.path1().c_str(), e.what());
|
||||||
return_code = EXIT_FAILURE;
|
return_code = EXIT_FAILURE;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -139,6 +145,7 @@ int main(int argc, char *argv[])
|
||||||
vector<vector<search::match>> matches_all;
|
vector<vector<search::match>> matches_all;
|
||||||
std::mutex mutex_matches_all;
|
std::mutex mutex_matches_all;
|
||||||
vector<std::future<int>> futurepool;
|
vector<std::future<int>> futurepool;
|
||||||
|
std::atomic<size_t> books_searched{0};
|
||||||
|
|
||||||
auto search_file{
|
auto search_file{
|
||||||
[&opts, &matches_all, &mutex_matches_all,
|
[&opts, &matches_all, &mutex_matches_all,
|
||||||
|
@ -170,18 +177,25 @@ int main(int argc, char *argv[])
|
||||||
catch (const std::ifstream::failure &e)
|
catch (const std::ifstream::failure &e)
|
||||||
{
|
{
|
||||||
LOG(log::sev::error)
|
LOG(log::sev::error)
|
||||||
<< std::strerror(errno)
|
<< std::strerror(errno) // FIXME: Not thread safe.
|
||||||
<< format(translate(" (while opening {0:s})").str(),
|
<< format(translate(" (while opening {0:s})")
|
||||||
filepath);
|
.str()
|
||||||
|
.c_str(),
|
||||||
|
filepath.c_str());
|
||||||
return EXIT_FAILURE;
|
return EXIT_FAILURE;
|
||||||
}
|
}
|
||||||
|
catch (const boost::regex_error &e)
|
||||||
|
{
|
||||||
|
LOG(log::sev::fatal) << e.what();
|
||||||
|
return EXIT_FATAL;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
return EXIT_SUCCESS;
|
return EXIT_SUCCESS;
|
||||||
}};
|
}};
|
||||||
|
|
||||||
auto futures_cleanup{
|
auto futures_cleanup{
|
||||||
[&futurepool, &return_code](const bool wait = false)
|
[&futurepool, &return_code, &books_searched](const bool wait = false)
|
||||||
{
|
{
|
||||||
using namespace std::chrono_literals;
|
using namespace std::chrono_literals;
|
||||||
|
|
||||||
|
@ -201,6 +215,7 @@ int main(int argc, char *argv[])
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
futurepool.erase(it);
|
futurepool.erase(it);
|
||||||
|
++books_searched;
|
||||||
}
|
}
|
||||||
}};
|
}};
|
||||||
|
|
||||||
|
@ -212,6 +227,27 @@ int main(int argc, char *argv[])
|
||||||
}()};
|
}()};
|
||||||
DEBUGLOG << "max_threads = " << max_threads;
|
DEBUGLOG << "max_threads = " << max_threads;
|
||||||
|
|
||||||
|
const auto print_status{
|
||||||
|
[&opts, &books_searched, &input_files](std::future<bool> cancel)
|
||||||
|
{
|
||||||
|
if (!opts.status)
|
||||||
|
{
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
while (cancel.wait_for(std::chrono::seconds(opts.status_interval))
|
||||||
|
!= std::future_status::ready)
|
||||||
|
{
|
||||||
|
std::cerr << format(translate("{0:d} of {1:d} books searched.")
|
||||||
|
.str()
|
||||||
|
.c_str(),
|
||||||
|
books_searched, input_files.size())
|
||||||
|
<< '\n';
|
||||||
|
}
|
||||||
|
std::cerr << translate("All books searched.") << '\n';
|
||||||
|
}};
|
||||||
|
std::promise<bool> promise_status;
|
||||||
|
std::thread thread_status{print_status, promise_status.get_future()};
|
||||||
|
|
||||||
for (const auto &filepath : input_files)
|
for (const auto &filepath : input_files)
|
||||||
{
|
{
|
||||||
while (futurepool.size() >= max_threads)
|
while (futurepool.size() >= max_threads)
|
||||||
|
@ -219,11 +255,15 @@ int main(int argc, char *argv[])
|
||||||
DEBUGLOG << "Attempting to clean up threads";
|
DEBUGLOG << "Attempting to clean up threads";
|
||||||
futures_cleanup();
|
futures_cleanup();
|
||||||
}
|
}
|
||||||
|
if (return_code == EXIT_FATAL)
|
||||||
|
{
|
||||||
|
break;
|
||||||
|
}
|
||||||
futurepool.emplace_back(
|
futurepool.emplace_back(
|
||||||
std::async(std::launch::async, search_file, filepath));
|
std::async(std::launch::async, search_file, filepath));
|
||||||
DEBUGLOG << "Launched new thread";
|
DEBUGLOG << "Launched new thread";
|
||||||
|
|
||||||
if (!matches_all.empty() && !opts.json)
|
if (!matches_all.empty() && !opts.json && !opts.html)
|
||||||
{
|
{
|
||||||
output::print_matches(matches_all[0], opts,
|
output::print_matches(matches_all[0], opts,
|
||||||
input_files.size() == 1);
|
input_files.size() == 1);
|
||||||
|
@ -233,11 +273,21 @@ int main(int argc, char *argv[])
|
||||||
}
|
}
|
||||||
DEBUGLOG << "Waiting for remaining threads to finish";
|
DEBUGLOG << "Waiting for remaining threads to finish";
|
||||||
futures_cleanup(true);
|
futures_cleanup(true);
|
||||||
|
promise_status.set_value(true);
|
||||||
|
thread_status.join();
|
||||||
|
if (return_code == EXIT_FATAL)
|
||||||
|
{
|
||||||
|
return EXIT_FATAL;
|
||||||
|
}
|
||||||
|
|
||||||
if (opts.json)
|
if (opts.json)
|
||||||
{
|
{
|
||||||
output::json_all(matches_all);
|
output::json_all(matches_all);
|
||||||
}
|
}
|
||||||
|
else if (opts.html)
|
||||||
|
{
|
||||||
|
output::html_all(matches_all, opts);
|
||||||
|
}
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
for (const auto &matches : matches_all)
|
for (const auto &matches : matches_all)
|
||||||
|
|
|
@ -49,13 +49,19 @@ using std::cout;
|
||||||
|
|
||||||
options parse_options(int argc, char *argv[])
|
options parse_options(int argc, char *argv[])
|
||||||
{
|
{
|
||||||
po::options_description options_visible(translate("Available options"));
|
|
||||||
// clang-format off
|
// clang-format off
|
||||||
options_visible.add_options()
|
po::options_description options_general(translate("General options"));
|
||||||
|
options_general.add_options()
|
||||||
("help,h",
|
("help,h",
|
||||||
translate("Display this help and exit.").str().data())
|
translate("Display this help and exit.").str().data())
|
||||||
("version,V",
|
("version,V",
|
||||||
translate("Display version information and exit.").str().data())
|
translate("Display version information and exit.").str().data())
|
||||||
|
("debug",
|
||||||
|
translate("Enable debug output.").str().data())
|
||||||
|
;
|
||||||
|
|
||||||
|
po::options_description options_search(translate("Search options"));
|
||||||
|
options_search.add_options()
|
||||||
("basic-regexp,G",
|
("basic-regexp,G",
|
||||||
translate("PATTERN is a basic regular expression (default).")
|
translate("PATTERN is a basic regular expression (default).")
|
||||||
.str().data())
|
.str().data())
|
||||||
|
@ -66,14 +72,25 @@ options parse_options(int argc, char *argv[])
|
||||||
.str().data())
|
.str().data())
|
||||||
("perl-regexp,P",
|
("perl-regexp,P",
|
||||||
translate("PATTERN is a Perl regular expression.").str().data())
|
translate("PATTERN is a Perl regular expression.").str().data())
|
||||||
|
|
||||||
("ignore-case,i",
|
("ignore-case,i",
|
||||||
translate("Ignore case distinctions in pattern and data.")
|
translate("Ignore case distinctions in pattern and data.")
|
||||||
.str().data())
|
.str().data())
|
||||||
|
("raw,a",
|
||||||
|
translate("Do not clean up text before searching.").str().data())
|
||||||
|
("recursive,r",
|
||||||
|
translate("Read all files under each directory, recursively.")
|
||||||
|
.str().data())
|
||||||
|
("dereference-recursive,R",
|
||||||
|
translate("Read all files under each directory, recursively, "
|
||||||
|
"following symlinks.").str().data())
|
||||||
("regexp,e", po::value<std::vector<std::string>>()
|
("regexp,e", po::value<std::vector<std::string>>()
|
||||||
->value_name(translate("PATTERN"))->composing()->required(),
|
->value_name(translate("PATTERN"))->composing()->required(),
|
||||||
translate("Use additional PATTERN for matching.").str().data())
|
translate("Use additional PATTERN for matching.").str().data())
|
||||||
("raw,a",
|
;
|
||||||
translate("Do not clean up text before searching.").str().data())
|
|
||||||
|
po::options_description options_output(translate("Output options"));
|
||||||
|
options_output.add_options()
|
||||||
("context,C", po::value<std::uint64_t>()
|
("context,C", po::value<std::uint64_t>()
|
||||||
->value_name(translate("NUMBER"))->default_value(0),
|
->value_name(translate("NUMBER"))->default_value(0),
|
||||||
translate("Print NUMBER words of context around matches.")
|
translate("Print NUMBER words of context around matches.")
|
||||||
|
@ -83,18 +100,19 @@ options parse_options(int argc, char *argv[])
|
||||||
("no-filename",po::value<std::string>()->value_name(translate("WHICH")),
|
("no-filename",po::value<std::string>()->value_name(translate("WHICH")),
|
||||||
translate("Suppress the mentioning of file names on output. "
|
translate("Suppress the mentioning of file names on output. "
|
||||||
"WHICH is ‘filesystem’, ‘in-epub’ or ‘all’.").str().data())
|
"WHICH is ‘filesystem’, ‘in-epub’ or ‘all’.").str().data())
|
||||||
("recursive,r",
|
|
||||||
translate("Read all files under each directory, recursively.")
|
|
||||||
.str().data())
|
|
||||||
("dereference-recursive,R",
|
|
||||||
translate("Read all files under each directory, recursively, "
|
|
||||||
"following symlinks.") .str().data())
|
|
||||||
("ignore-archive-errors",
|
("ignore-archive-errors",
|
||||||
translate("Ignore errors about wrong file formats.") .str().data())
|
translate("Ignore errors about wrong file formats.").str().data())
|
||||||
("debug",
|
|
||||||
translate("Enable debug output.") .str().data())
|
|
||||||
("json",
|
("json",
|
||||||
translate("Output JSON instead of plain text.") .str().data())
|
translate("Output JSON instead of plain text.").str().data())
|
||||||
|
("html",
|
||||||
|
translate("Output HTML instead of plain text.").str().data())
|
||||||
|
("status",
|
||||||
|
translate("Output status message every STATUS-INTERVAL seconds.")
|
||||||
|
.str().data())
|
||||||
|
("status-interval", po::value<std::uint64_t>()
|
||||||
|
->value_name(translate("NUMBER"))->default_value(30),
|
||||||
|
translate("Set status message interval to NUMBER seconds.")
|
||||||
|
.str().data())
|
||||||
;
|
;
|
||||||
|
|
||||||
po::options_description options_hidden("Hidden options");
|
po::options_description options_hidden("Hidden options");
|
||||||
|
@ -103,6 +121,12 @@ options parse_options(int argc, char *argv[])
|
||||||
->value_name("FILE"), "Input file to search.")
|
->value_name("FILE"), "Input file to search.")
|
||||||
;
|
;
|
||||||
// clang-format on
|
// clang-format on
|
||||||
|
|
||||||
|
po::options_description options_visible;
|
||||||
|
options_visible.add(options_general)
|
||||||
|
.add(options_search)
|
||||||
|
.add(options_output);
|
||||||
|
|
||||||
po::options_description options_all("Allowed options");
|
po::options_description options_all("Allowed options");
|
||||||
options_all.add(options_visible).add(options_hidden);
|
options_all.add(options_visible).add(options_hidden);
|
||||||
|
|
||||||
|
@ -135,7 +159,7 @@ options parse_options(int argc, char *argv[])
|
||||||
|
|
||||||
if (vm.count("help") != 0)
|
if (vm.count("help") != 0)
|
||||||
{
|
{
|
||||||
cout << translate("Usage: epubgrep [OPTION]… PATTERN [FILE]…\n");
|
cout << translate("Usage: epubgrep [OPTION]… PATTERN FILE…\n");
|
||||||
cout << options_visible;
|
cout << options_visible;
|
||||||
cout << translate("\nYou can access the full manual "
|
cout << translate("\nYou can access the full manual "
|
||||||
"with `man epubgrep`.\n");
|
"with `man epubgrep`.\n");
|
||||||
|
@ -235,6 +259,9 @@ options parse_again(const po::variables_map &vm)
|
||||||
opts.ignore_archive_errors = vm.count("ignore-archive-errors") > 0;
|
opts.ignore_archive_errors = vm.count("ignore-archive-errors") > 0;
|
||||||
opts.debug = vm.count("debug") > 0;
|
opts.debug = vm.count("debug") > 0;
|
||||||
opts.json = vm.count("json") > 0;
|
opts.json = vm.count("json") > 0;
|
||||||
|
opts.html = vm.count("html") > 0;
|
||||||
|
opts.status = vm.count("status") > 0;
|
||||||
|
opts.status_interval = vm["status-interval"].as<std::uint64_t>();
|
||||||
|
|
||||||
if (vm.count("regexp") > 0)
|
if (vm.count("regexp") > 0)
|
||||||
{
|
{
|
||||||
|
|
|
@ -58,6 +58,9 @@ struct options
|
||||||
bool ignore_archive_errors{false};
|
bool ignore_archive_errors{false};
|
||||||
bool debug{false};
|
bool debug{false};
|
||||||
bool json{false};
|
bool json{false};
|
||||||
|
bool html{false};
|
||||||
|
bool status{false};
|
||||||
|
uint64_t status_interval{0};
|
||||||
|
|
||||||
//! For the debug output.
|
//! For the debug output.
|
||||||
friend std::ostream &operator<<(std::ostream &out, const options &opts);
|
friend std::ostream &operator<<(std::ostream &out, const options &opts);
|
||||||
|
|
153
src/output.cpp
153
src/output.cpp
|
@ -24,6 +24,7 @@
|
||||||
#include <nlohmann/json.hpp>
|
#include <nlohmann/json.hpp>
|
||||||
#include <termcolor/termcolor.hpp>
|
#include <termcolor/termcolor.hpp>
|
||||||
|
|
||||||
|
#include <cstdint>
|
||||||
#include <iostream>
|
#include <iostream>
|
||||||
#include <sstream>
|
#include <sstream>
|
||||||
|
|
||||||
|
@ -37,27 +38,22 @@ using std::cout;
|
||||||
void print_matches(const std::vector<search::match> &matches,
|
void print_matches(const std::vector<search::match> &matches,
|
||||||
const options::options &opts, bool single_file)
|
const options::options &opts, bool single_file)
|
||||||
{
|
{
|
||||||
fs::path last_epub;
|
if (!single_file && !opts.no_fn_fs)
|
||||||
|
{
|
||||||
|
if (!opts.nocolor)
|
||||||
|
{
|
||||||
|
cout << termcolor::yellow;
|
||||||
|
}
|
||||||
|
cout << format(translate(" In {0:s}: \n").str().c_str(),
|
||||||
|
fs::relative(matches[0].filepath_epub).c_str());
|
||||||
|
if (!opts.nocolor)
|
||||||
|
{
|
||||||
|
cout << termcolor::reset;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
for (const auto &match : matches)
|
for (const auto &match : matches)
|
||||||
{
|
{
|
||||||
if (!single_file && !opts.no_fn_fs)
|
|
||||||
{
|
|
||||||
if (match.filepath_epub != last_epub)
|
|
||||||
{
|
|
||||||
if (!opts.nocolor)
|
|
||||||
{
|
|
||||||
cout << termcolor::yellow;
|
|
||||||
}
|
|
||||||
cout << format(translate(" In {0:s}: \n").str(),
|
|
||||||
fs::relative(match.filepath_epub));
|
|
||||||
last_epub = match.filepath_epub;
|
|
||||||
if (!opts.nocolor)
|
|
||||||
{
|
|
||||||
cout << termcolor::reset;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
std::vector<std::string> metadata;
|
std::vector<std::string> metadata;
|
||||||
if (!opts.no_fn_epub)
|
if (!opts.no_fn_epub)
|
||||||
{
|
{
|
||||||
|
@ -82,22 +78,25 @@ void print_matches(const std::vector<search::match> &matches,
|
||||||
{
|
{
|
||||||
metadata.emplace_back("page " + match.page);
|
metadata.emplace_back("page " + match.page);
|
||||||
}
|
}
|
||||||
if (!opts.nocolor)
|
if (!metadata.empty())
|
||||||
{
|
{
|
||||||
cout << termcolor::italic;
|
if (!opts.nocolor)
|
||||||
}
|
|
||||||
for (const auto &part : metadata)
|
|
||||||
{
|
|
||||||
cout << part;
|
|
||||||
if (part != *(metadata.rbegin()))
|
|
||||||
{
|
{
|
||||||
cout << ", ";
|
cout << termcolor::italic;
|
||||||
|
}
|
||||||
|
for (const auto &part : metadata)
|
||||||
|
{
|
||||||
|
cout << part;
|
||||||
|
if (part != *(metadata.rbegin()))
|
||||||
|
{
|
||||||
|
cout << ", ";
|
||||||
|
}
|
||||||
|
}
|
||||||
|
cout << ": ";
|
||||||
|
if (!opts.nocolor)
|
||||||
|
{
|
||||||
|
cout << termcolor::reset;
|
||||||
}
|
}
|
||||||
}
|
|
||||||
cout << ": ";
|
|
||||||
if (!opts.nocolor)
|
|
||||||
{
|
|
||||||
cout << termcolor::reset;
|
|
||||||
}
|
}
|
||||||
cout << match.context.first;
|
cout << match.context.first;
|
||||||
if (!opts.nocolor)
|
if (!opts.nocolor)
|
||||||
|
@ -133,7 +132,95 @@ void json_all(const std::vector<std::vector<search::match>> &matches_all)
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
std::cout << json.dump() << '\n';
|
cout << json.dump() << '\n';
|
||||||
|
}
|
||||||
|
|
||||||
|
void html_all(const std::vector<std::vector<search::match>> &matches_all,
|
||||||
|
const options::options &opts)
|
||||||
|
{
|
||||||
|
std::uint64_t count{1};
|
||||||
|
|
||||||
|
cout << "<!DOCTYPE html>\n";
|
||||||
|
// Translators: Replace “en” with your language code here.
|
||||||
|
cout << format(R"(<html lang="{0:s}">)", translate("en").str());
|
||||||
|
cout << "<head><title>epubgrep output</title>"
|
||||||
|
"<style>article { margin: 1em; }</style>"
|
||||||
|
"</head><body>\n\n";
|
||||||
|
|
||||||
|
for (const auto &matches : matches_all)
|
||||||
|
{
|
||||||
|
const auto identifier{
|
||||||
|
[&opts, count, &matches]
|
||||||
|
{
|
||||||
|
if (opts.no_fn_fs)
|
||||||
|
{
|
||||||
|
return format(translate("File {0:d}").str(), count);
|
||||||
|
}
|
||||||
|
return fs::relative(matches[0].filepath_epub).string();
|
||||||
|
}()};
|
||||||
|
|
||||||
|
// Start article, table and print table header.
|
||||||
|
cout << format(R"(<article aria-labelledby="file_{0:d}">)", count)
|
||||||
|
<< "\n <table>\n"
|
||||||
|
<< format(R"( <caption id="file_{0:d}">{1:s}</caption>)", count,
|
||||||
|
identifier)
|
||||||
|
<< '\n'
|
||||||
|
<< " <tr>\n";
|
||||||
|
if (!opts.no_fn_epub)
|
||||||
|
{
|
||||||
|
cout << format(R"( <th id="file_path_{0:d}">{1:s}</th>)",
|
||||||
|
count,
|
||||||
|
translate("File path (in EPUB file)").str().c_str())
|
||||||
|
<< '\n';
|
||||||
|
}
|
||||||
|
cout << format(R"( <th id="headline_{0:d}">{1:s}</th>)", count,
|
||||||
|
translate("Last headline").str().c_str())
|
||||||
|
<< '\n'
|
||||||
|
<< format(R"( <th id="page_{0:d}">{1:s}</th>)", count,
|
||||||
|
translate("Page number").str().c_str())
|
||||||
|
<< '\n'
|
||||||
|
<< format(R"( <th id="match_{0:d}">{1:s}</th>)", count,
|
||||||
|
translate("Match").str().c_str())
|
||||||
|
<< "\n </tr>\n";
|
||||||
|
|
||||||
|
for (const auto &match : matches)
|
||||||
|
{
|
||||||
|
const auto lang{[&match]
|
||||||
|
{
|
||||||
|
if (!match.language.empty())
|
||||||
|
{
|
||||||
|
return format(R"( lang="{0:s}")",
|
||||||
|
match.language);
|
||||||
|
}
|
||||||
|
return std::string{};
|
||||||
|
}()};
|
||||||
|
cout << " <tr>\n";
|
||||||
|
if (!opts.no_fn_epub)
|
||||||
|
{
|
||||||
|
cout << format(
|
||||||
|
R"( <td headers="file_path_{0:d}">{1:s}</td>)", count,
|
||||||
|
match.filepath_inside)
|
||||||
|
<< '\n';
|
||||||
|
}
|
||||||
|
cout << format(
|
||||||
|
R"( <td headers="headline_{0:d}"{1:s}>{2:s}</td>)", count,
|
||||||
|
lang, match.headline)
|
||||||
|
<< '\n';
|
||||||
|
cout << format(R"( <td headers="page_{0:d}">{1:s}</td>)",
|
||||||
|
count, match.page)
|
||||||
|
<< '\n';
|
||||||
|
cout << format(R"( <td headers="match_{0:d}"{1:s}>{2:s})"
|
||||||
|
R"(<strong>{3:s}</strong>{4:s}</td>)",
|
||||||
|
count, lang, match.context.first, match.text,
|
||||||
|
match.context.second)
|
||||||
|
<< '\n';
|
||||||
|
cout << " </tr>\n";
|
||||||
|
}
|
||||||
|
cout << " </table>\n</article>\n\n";
|
||||||
|
++count;
|
||||||
|
}
|
||||||
|
|
||||||
|
cout << "</body></html>\n";
|
||||||
}
|
}
|
||||||
|
|
||||||
} // namespace epubgrep::output
|
} // namespace epubgrep::output
|
||||||
|
|
|
@ -25,11 +25,17 @@
|
||||||
namespace epubgrep::output
|
namespace epubgrep::output
|
||||||
{
|
{
|
||||||
|
|
||||||
|
// Print the matches of an EPUB.
|
||||||
void print_matches(const std::vector<search::match> &matches,
|
void print_matches(const std::vector<search::match> &matches,
|
||||||
const options::options &opts, bool single_file);
|
const options::options &opts, bool single_file);
|
||||||
|
|
||||||
|
//! Print all matches as JSON.
|
||||||
void json_all(const std::vector<std::vector<search::match>> &matches_all);
|
void json_all(const std::vector<std::vector<search::match>> &matches_all);
|
||||||
|
|
||||||
|
//! Print all matches as HTML.
|
||||||
|
void html_all(const std::vector<std::vector<search::match>> &matches_all,
|
||||||
|
const options::options &opts);
|
||||||
|
|
||||||
} // namespace epubgrep::output
|
} // namespace epubgrep::output
|
||||||
|
|
||||||
#endif // EPUBGREP_OUTPUT_HPP
|
#endif // EPUBGREP_OUTPUT_HPP
|
||||||
|
|
169
src/search.cpp
169
src/search.cpp
|
@ -16,6 +16,7 @@
|
||||||
|
|
||||||
#include "search.hpp"
|
#include "search.hpp"
|
||||||
|
|
||||||
|
#include "book.hpp"
|
||||||
#include "fs-compat.hpp"
|
#include "fs-compat.hpp"
|
||||||
#include "helpers.hpp"
|
#include "helpers.hpp"
|
||||||
#include "log.hpp"
|
#include "log.hpp"
|
||||||
|
@ -27,6 +28,8 @@
|
||||||
|
|
||||||
#include <algorithm>
|
#include <algorithm>
|
||||||
#include <array>
|
#include <array>
|
||||||
|
#include <iterator>
|
||||||
|
#include <memory>
|
||||||
#include <string>
|
#include <string>
|
||||||
#include <string_view>
|
#include <string_view>
|
||||||
#include <vector>
|
#include <vector>
|
||||||
|
@ -41,8 +44,8 @@ std::vector<match> search(const fs::path &filepath,
|
||||||
const std::string_view regex, const settings &opts)
|
const std::string_view regex, const settings &opts)
|
||||||
{
|
{
|
||||||
LOG(log::sev::info)
|
LOG(log::sev::info)
|
||||||
<< format(R"(Starting search in {0:s} using regex "{1:s}")", filepath,
|
<< format(R"(Starting search in {0:s} using regex "{1:s}")",
|
||||||
regex);
|
filepath.c_str(), regex);
|
||||||
boost::regex::flag_type flags{};
|
boost::regex::flag_type flags{};
|
||||||
|
|
||||||
switch (opts.regex)
|
switch (opts.regex)
|
||||||
|
@ -71,119 +74,37 @@ std::vector<match> search(const fs::path &filepath,
|
||||||
|
|
||||||
const boost::regex re(regex.data(), flags);
|
const boost::regex re(regex.data(), flags);
|
||||||
std::vector<match> matches;
|
std::vector<match> matches;
|
||||||
std::vector<string> epub_filepaths{[&opts, &filepath]
|
auto book{book::read(filepath, opts.raw)};
|
||||||
{
|
for (const auto &file : book.files)
|
||||||
if (!opts.raw)
|
|
||||||
{
|
|
||||||
return zip::list_spine(filepath);
|
|
||||||
}
|
|
||||||
return zip::list(filepath);
|
|
||||||
}()};
|
|
||||||
|
|
||||||
for (const auto &entry : epub_filepaths)
|
|
||||||
{
|
{
|
||||||
DEBUGLOG << "Processing " << entry;
|
const auto &doc{file.second};
|
||||||
auto document{zip::read_file(filepath, entry)};
|
string::const_iterator begin{doc.text->begin()};
|
||||||
if (!opts.raw)
|
string::const_iterator end{doc.text->end()};
|
||||||
{
|
auto begin_text{begin};
|
||||||
cleanup_text(document);
|
|
||||||
document = helpers::unescape_html(document);
|
|
||||||
}
|
|
||||||
|
|
||||||
string::const_iterator begin{document.begin()};
|
|
||||||
string::const_iterator end{document.end()};
|
|
||||||
boost::match_results<string::const_iterator> match_result;
|
boost::match_results<string::const_iterator> match_result;
|
||||||
string last_headline;
|
|
||||||
string last_page;
|
|
||||||
|
|
||||||
while (boost::regex_search(begin, end, match_result, re,
|
while (boost::regex_search(begin, end, match_result, re,
|
||||||
boost::match_default))
|
boost::match_default))
|
||||||
{
|
{
|
||||||
match match; // FIXME: Rename variable or struct.
|
match match; // FIXME: Rename variable or struct.
|
||||||
match.filepath_epub = filepath;
|
match.filepath_epub = filepath;
|
||||||
match.filepath_inside = entry;
|
match.filepath_inside = file.first;
|
||||||
match.text = match_result[0];
|
match.text = match_result[0];
|
||||||
match.context = context(match_result, opts.context);
|
match.context = context(match_result, opts.context);
|
||||||
const auto current_headline{headline(match_result.prefix().str())};
|
const auto pos = static_cast<size_t>(
|
||||||
if (!current_headline.empty())
|
std::distance(begin_text, match_result[0].begin()));
|
||||||
{
|
match.headline = headline(doc, pos);
|
||||||
last_headline = current_headline;
|
match.page = page(doc, pos);
|
||||||
}
|
match.language = doc.language; // FIXME: Get language of match.
|
||||||
match.headline = last_headline;
|
|
||||||
const auto current_page{page(match_result.prefix().str())};
|
|
||||||
if (!current_page.empty())
|
|
||||||
{
|
|
||||||
last_page = current_page;
|
|
||||||
}
|
|
||||||
match.page = last_page;
|
|
||||||
|
|
||||||
matches.emplace_back(match);
|
matches.emplace_back(match);
|
||||||
begin = match_result[0].second;
|
begin = match_result[0].end();
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
return matches;
|
return matches;
|
||||||
}
|
}
|
||||||
|
|
||||||
void cleanup_text(string &text)
|
|
||||||
{
|
|
||||||
static const boost::regex re_header_start{"<[hH][1-6]"};
|
|
||||||
static const boost::regex re_header_end{"</[hH][1-6]"};
|
|
||||||
static const boost::regex re_pagebreak{".+pagebreak.+(title|aria-label)"
|
|
||||||
"=\"([[:alnum:]]+)\".*"};
|
|
||||||
|
|
||||||
size_t pos{};
|
|
||||||
while ((pos = text.find('<', pos)) != string::npos)
|
|
||||||
{
|
|
||||||
// Mark headlines. We need them later on.
|
|
||||||
string replacement;
|
|
||||||
if (boost::regex_match(text.substr(pos, 3), re_header_start))
|
|
||||||
{
|
|
||||||
replacement = "<H>";
|
|
||||||
}
|
|
||||||
else if (boost::regex_match(text.substr(pos, 4), re_header_end))
|
|
||||||
{
|
|
||||||
replacement = "</H>";
|
|
||||||
}
|
|
||||||
else if (text.substr(pos, 6) == "<span ")
|
|
||||||
{
|
|
||||||
auto endpos{text.find('>')};
|
|
||||||
boost::match_results<const char *> match;
|
|
||||||
if (boost::regex_search(text.substr(pos, endpos).data(), match,
|
|
||||||
re_pagebreak))
|
|
||||||
{
|
|
||||||
replacement = "<PAGE " + match[2] + ">";
|
|
||||||
}
|
|
||||||
}
|
|
||||||
else if (text.substr(pos, 7) == "<style "
|
|
||||||
|| text.substr(pos, 8) == "<script ")
|
|
||||||
{
|
|
||||||
pos = text.find('>', pos) + 1;
|
|
||||||
}
|
|
||||||
|
|
||||||
text.replace(pos, text.find('>', pos) + 1 - pos, replacement);
|
|
||||||
pos += replacement.length();
|
|
||||||
}
|
|
||||||
|
|
||||||
pos = 0;
|
|
||||||
while ((pos = text.find('\r', pos)) != string::npos)
|
|
||||||
{
|
|
||||||
text.erase(pos, 1);
|
|
||||||
}
|
|
||||||
|
|
||||||
pos = 0;
|
|
||||||
while ((pos = text.find_first_of("\n\t", pos)) != string::npos)
|
|
||||||
{
|
|
||||||
text.replace(pos, 1, " ");
|
|
||||||
}
|
|
||||||
|
|
||||||
pos = 0;
|
|
||||||
while ((pos = text.find(" ", pos)) != string::npos)
|
|
||||||
{
|
|
||||||
text.replace(pos, 2, " ");
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
match_context context(const boost::match_results<string::const_iterator> &match,
|
match_context context(const boost::match_results<string::const_iterator> &match,
|
||||||
std::uint64_t words)
|
std::uint64_t words)
|
||||||
{
|
{
|
||||||
|
@ -212,12 +133,10 @@ match_context context(const boost::match_results<string::const_iterator> &match,
|
||||||
pos_before = std::find_first_of(pos_before, rend_before,
|
pos_before = std::find_first_of(pos_before, rend_before,
|
||||||
whitespace.begin(),
|
whitespace.begin(),
|
||||||
whitespace.end());
|
whitespace.end());
|
||||||
if (pos_before != rend_before)
|
while (pos_before != rend_before
|
||||||
|
&& helpers::is_whitespace(*pos_before))
|
||||||
{
|
{
|
||||||
while (helpers::is_whitespace(*pos_before))
|
++pos_before;
|
||||||
{
|
|
||||||
++pos_before;
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -226,20 +145,17 @@ match_context context(const boost::match_results<string::const_iterator> &match,
|
||||||
pos_after = std::find_first_of(pos_after, end_after,
|
pos_after = std::find_first_of(pos_after, end_after,
|
||||||
whitespace.begin(),
|
whitespace.begin(),
|
||||||
whitespace.end());
|
whitespace.end());
|
||||||
if (pos_after != end_after)
|
while (pos_after != end_after && helpers::is_whitespace(*pos_after))
|
||||||
{
|
{
|
||||||
while (helpers::is_whitespace(*pos_after))
|
++pos_after;
|
||||||
{
|
|
||||||
++pos_after;
|
|
||||||
}
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
words -= 1;
|
words -= 1;
|
||||||
}
|
}
|
||||||
|
|
||||||
const std::string before_reversed(rbegin_before, pos_before);
|
const string before_reversed(rbegin_before, pos_before);
|
||||||
string before(before_reversed.rbegin(), before_reversed.rend());
|
string before(before_reversed.rbegin(), before_reversed.rend());
|
||||||
std::string after(begin_after, pos_after);
|
string after(begin_after, pos_after);
|
||||||
while (helpers::is_whitespace(*before.begin()))
|
while (helpers::is_whitespace(*before.begin()))
|
||||||
{
|
{
|
||||||
before.erase(0, 1);
|
before.erase(0, 1);
|
||||||
|
@ -252,39 +168,4 @@ match_context context(const boost::match_results<string::const_iterator> &match,
|
||||||
return {before, after};
|
return {before, after};
|
||||||
}
|
}
|
||||||
|
|
||||||
string headline(const std::string_view prefix)
|
|
||||||
{
|
|
||||||
size_t pos{prefix.length()};
|
|
||||||
if ((pos = prefix.rfind("<H>", pos)) != std::string_view::npos)
|
|
||||||
{
|
|
||||||
pos += 3;
|
|
||||||
string result{prefix.substr(pos, prefix.find('<', pos) - pos)};
|
|
||||||
|
|
||||||
while (helpers::is_whitespace(*result.begin()))
|
|
||||||
{
|
|
||||||
result.erase(0, 1);
|
|
||||||
}
|
|
||||||
while (helpers::is_whitespace(*result.rbegin()))
|
|
||||||
{
|
|
||||||
result.erase(result.size() - 1);
|
|
||||||
}
|
|
||||||
|
|
||||||
return result;
|
|
||||||
}
|
|
||||||
|
|
||||||
return {};
|
|
||||||
}
|
|
||||||
|
|
||||||
string page(const std::string_view prefix)
|
|
||||||
{
|
|
||||||
size_t pos{prefix.length()};
|
|
||||||
while ((pos = prefix.rfind("<PAGE ", pos)) != std::string_view::npos)
|
|
||||||
{
|
|
||||||
pos += 6;
|
|
||||||
return string{prefix.substr(pos, prefix.find('>', pos) - pos)};
|
|
||||||
}
|
|
||||||
|
|
||||||
return {};
|
|
||||||
}
|
|
||||||
|
|
||||||
} // namespace epubgrep::search
|
} // namespace epubgrep::search
|
||||||
|
|
|
@ -22,7 +22,9 @@
|
||||||
|
|
||||||
#include <boost/regex.hpp>
|
#include <boost/regex.hpp>
|
||||||
|
|
||||||
|
#include <cstddef>
|
||||||
#include <cstdint>
|
#include <cstdint>
|
||||||
|
#include <map>
|
||||||
#include <string>
|
#include <string>
|
||||||
#include <string_view>
|
#include <string_view>
|
||||||
#include <utility>
|
#include <utility>
|
||||||
|
@ -41,7 +43,8 @@ struct match
|
||||||
std::string filepath_inside; //!< The file path of the matched line.
|
std::string filepath_inside; //!< The file path of the matched line.
|
||||||
std::string headline; //!< The last headline, if available.
|
std::string headline; //!< The last headline, if available.
|
||||||
std::string page; //!< The page number, if available.
|
std::string page; //!< The page number, if available.
|
||||||
};
|
std::string language; //!< Match language.
|
||||||
|
} __attribute__((aligned(128)));
|
||||||
|
|
||||||
struct settings
|
struct settings
|
||||||
{
|
{
|
||||||
|
@ -50,27 +53,25 @@ struct settings
|
||||||
bool ignore_case{false};
|
bool ignore_case{false};
|
||||||
bool raw{false};
|
bool raw{false};
|
||||||
std::uint64_t context{0};
|
std::uint64_t context{0};
|
||||||
};
|
} __attribute__((aligned(16)));
|
||||||
|
|
||||||
|
struct file_in_epub
|
||||||
|
{
|
||||||
|
std::string text;
|
||||||
|
std::map<size_t, std::string> headlines;
|
||||||
|
std::map<size_t, std::string> pages;
|
||||||
|
} __attribute__((aligned(128)));
|
||||||
|
|
||||||
//! Search file, return matches.
|
//! Search file, return matches.
|
||||||
[[nodiscard]] std::vector<match> search(const fs::path &filepath,
|
[[nodiscard]] std::vector<match> search(const fs::path &filepath,
|
||||||
std::string_view regex,
|
std::string_view regex,
|
||||||
const settings &opts);
|
const settings &opts);
|
||||||
|
|
||||||
//! Strip HTML, remove newlines, condense spaces.
|
|
||||||
void cleanup_text(std::string &text);
|
|
||||||
|
|
||||||
//! Return words before and after the match.
|
//! Return words before and after the match.
|
||||||
[[nodiscard]] match_context
|
[[nodiscard]] match_context
|
||||||
context(const boost::match_results<std::string::const_iterator> &match,
|
context(const boost::match_results<std::string::const_iterator> &match,
|
||||||
std::uint64_t words);
|
std::uint64_t words);
|
||||||
|
|
||||||
//! Return last headline if possible.
|
|
||||||
[[nodiscard]] std::string headline(std::string_view prefix);
|
|
||||||
|
|
||||||
//! Return current page if possible.
|
|
||||||
[[nodiscard]] std::string page(std::string_view prefix);
|
|
||||||
|
|
||||||
} // namespace epubgrep::search
|
} // namespace epubgrep::search
|
||||||
|
|
||||||
#endif // EPUBGREP_SEARCH_HPP
|
#endif // EPUBGREP_SEARCH_HPP
|
||||||
|
|
97
src/zip.cpp
97
src/zip.cpp
|
@ -25,7 +25,6 @@
|
||||||
#include <boost/locale/message.hpp>
|
#include <boost/locale/message.hpp>
|
||||||
#include <fmt/format.h>
|
#include <fmt/format.h>
|
||||||
#include <fmt/ostream.h> // For compatibility with fmt 4.
|
#include <fmt/ostream.h> // For compatibility with fmt 4.
|
||||||
#include <pugixml.hpp>
|
|
||||||
|
|
||||||
#include <cstdlib>
|
#include <cstdlib>
|
||||||
#include <cstring>
|
#include <cstring>
|
||||||
|
@ -56,8 +55,8 @@ std::vector<std::string> list(const fs::path &filepath)
|
||||||
<< format(translate("File in {0:s} is damaged. "
|
<< format(translate("File in {0:s} is damaged. "
|
||||||
"Skipping in-EPUB file.\n")
|
"Skipping in-EPUB file.\n")
|
||||||
.str()
|
.str()
|
||||||
.data(),
|
.c_str(),
|
||||||
filepath);
|
filepath.c_str());
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
toc.emplace_back(in_epub_filepath);
|
toc.emplace_back(in_epub_filepath);
|
||||||
|
@ -85,7 +84,7 @@ std::string read_file(const fs::path &filepath, std::string_view entry_path)
|
||||||
"Skipping in-EPUB file.\n")
|
"Skipping in-EPUB file.\n")
|
||||||
.str()
|
.str()
|
||||||
.data(),
|
.data(),
|
||||||
filepath);
|
filepath.c_str());
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
if (std::strcmp(path, entry_path.data()) == 0)
|
if (std::strcmp(path, entry_path.data()) == 0)
|
||||||
|
@ -100,9 +99,9 @@ std::string read_file(const fs::path &filepath, std::string_view entry_path)
|
||||||
{
|
{
|
||||||
close_file(zipfile, filepath);
|
close_file(zipfile, filepath);
|
||||||
|
|
||||||
throw exception{
|
throw exception{format(
|
||||||
format(translate("Could not read {0:s} in {1:s}.").str(),
|
translate("Could not read {0:s} in {1:s}.").str().c_str(),
|
||||||
entry_path, filepath.string())};
|
entry_path, filepath.string())};
|
||||||
}
|
}
|
||||||
|
|
||||||
close_file(zipfile, filepath);
|
close_file(zipfile, filepath);
|
||||||
|
@ -116,7 +115,7 @@ std::string read_file(const fs::path &filepath, std::string_view entry_path)
|
||||||
|
|
||||||
if (entry_path == "META-INF/container.xml")
|
if (entry_path == "META-INF/container.xml")
|
||||||
{ // File is probably not an EPUB.
|
{ // File is probably not an EPUB.
|
||||||
exception e{format(translate("{0:s} not found in {1:s}.").str(),
|
exception e{format(translate("{0:s} not found in {1:s}.").str().c_str(),
|
||||||
entry_path, filepath.string())};
|
entry_path, filepath.string())};
|
||||||
e.code = 1;
|
e.code = 1;
|
||||||
throw exception{e};
|
throw exception{e};
|
||||||
|
@ -146,7 +145,7 @@ struct archive *open_file(const fs::path &filepath)
|
||||||
{
|
{
|
||||||
close_file(zipfile, filepath);
|
close_file(zipfile, filepath);
|
||||||
|
|
||||||
exception e{format(translate("Could not open {0:s}.").str(),
|
exception e{format(translate("Could not open {0:s}.").str().c_str(),
|
||||||
filepath.string())};
|
filepath.string())};
|
||||||
e.code = 1;
|
e.code = 1;
|
||||||
throw exception{e};
|
throw exception{e};
|
||||||
|
@ -160,84 +159,10 @@ void close_file(struct archive *zipfile, const fs::path &filepath)
|
||||||
auto result{archive_read_free(zipfile)};
|
auto result{archive_read_free(zipfile)};
|
||||||
if (result != ARCHIVE_OK)
|
if (result != ARCHIVE_OK)
|
||||||
{
|
{
|
||||||
throw exception{format(translate("Could not close {0:s}.").str(),
|
throw exception{
|
||||||
filepath.string())};
|
format(translate("Could not close {0:s}.").str().c_str(),
|
||||||
|
filepath.string())};
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
std::vector<std::string> list_spine(const fs::path &filepath)
|
|
||||||
{
|
|
||||||
const fs::path opf_file_path{
|
|
||||||
[&filepath]
|
|
||||||
{
|
|
||||||
pugi::xml_document xml;
|
|
||||||
const std::string container{
|
|
||||||
read_file(filepath, "META-INF/container.xml")};
|
|
||||||
const auto result{xml.load_buffer(&container[0], container.size())};
|
|
||||||
if (result)
|
|
||||||
{
|
|
||||||
return xml.child("container")
|
|
||||||
.child("rootfiles")
|
|
||||||
.first_child()
|
|
||||||
.attribute("full-path")
|
|
||||||
.value();
|
|
||||||
}
|
|
||||||
LOG(log::sev::error) << result.description() << '\n';
|
|
||||||
|
|
||||||
return "";
|
|
||||||
}()};
|
|
||||||
|
|
||||||
std::vector<std::string> spine_filepaths;
|
|
||||||
if (!opf_file_path.empty())
|
|
||||||
{
|
|
||||||
DEBUGLOG << "Parsing " << opf_file_path;
|
|
||||||
pugi::xml_document xml;
|
|
||||||
const std::string opf_file{read_file(filepath, opf_file_path.string())};
|
|
||||||
const auto result{xml.load_buffer(&opf_file[0], opf_file.size())};
|
|
||||||
if (result)
|
|
||||||
{
|
|
||||||
auto manifest{xml.child("package").child("manifest")};
|
|
||||||
if (manifest == nullptr)
|
|
||||||
{
|
|
||||||
manifest = xml.child("opf:package").child("opf:manifest");
|
|
||||||
}
|
|
||||||
auto spine{xml.child("package").child("spine")};
|
|
||||||
if (spine == nullptr)
|
|
||||||
{
|
|
||||||
spine = xml.child("opf:package").child("opf:spine");
|
|
||||||
}
|
|
||||||
|
|
||||||
for (const auto &itemref : spine)
|
|
||||||
{
|
|
||||||
const auto &idref{itemref.attribute("idref").value()};
|
|
||||||
const auto &item{manifest.find_child_by_attribute("id", idref)};
|
|
||||||
auto href{helpers::urldecode(item.attribute("href").value())};
|
|
||||||
if (href[0] != '/')
|
|
||||||
{
|
|
||||||
href = (opf_file_path.parent_path() /= href);
|
|
||||||
}
|
|
||||||
DEBUGLOG << "Found in spine: " << href;
|
|
||||||
spine_filepaths.emplace_back(href);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
else
|
|
||||||
{
|
|
||||||
LOG(log::sev::error) << "XML: " << result.description() << '\n';
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
if (opf_file_path.empty() || spine_filepaths.empty())
|
|
||||||
{
|
|
||||||
LOG(log::sev::error)
|
|
||||||
<< format(translate("{0:s} is damaged. Could not read spine. "
|
|
||||||
"Skipping file.\n")
|
|
||||||
.str()
|
|
||||||
.data(),
|
|
||||||
filepath);
|
|
||||||
return {};
|
|
||||||
}
|
|
||||||
|
|
||||||
return spine_filepaths;
|
|
||||||
}
|
|
||||||
|
|
||||||
} // namespace epubgrep::zip
|
} // namespace epubgrep::zip
|
||||||
|
|
|
@ -43,9 +43,6 @@ namespace epubgrep::zip
|
||||||
//! Close zip file.
|
//! Close zip file.
|
||||||
void close_file(struct archive *zipfile, const fs::path &filepath);
|
void close_file(struct archive *zipfile, const fs::path &filepath);
|
||||||
|
|
||||||
//! Returns the files in the EPUB “spine” (all pages that are actually text).
|
|
||||||
[[nodiscard]] std::vector<std::string> list_spine(const fs::path &filepath);
|
|
||||||
|
|
||||||
//! It's std::runtime_error, but with another name.
|
//! It's std::runtime_error, but with another name.
|
||||||
class exception : public std::runtime_error
|
class exception : public std::runtime_error
|
||||||
{
|
{
|
||||||
|
|
|
@ -1,5 +1,3 @@
|
||||||
include(CTest)
|
|
||||||
|
|
||||||
file(GLOB sources_tests CONFIGURE_DEPENDS test_*.cpp)
|
file(GLOB sources_tests CONFIGURE_DEPENDS test_*.cpp)
|
||||||
file(COPY "test.zip" DESTINATION ${CMAKE_CURRENT_BINARY_DIR})
|
file(COPY "test.zip" DESTINATION ${CMAKE_CURRENT_BINARY_DIR})
|
||||||
file(COPY "test.epub2" DESTINATION ${CMAKE_CURRENT_BINARY_DIR})
|
file(COPY "test.epub2" DESTINATION ${CMAKE_CURRENT_BINARY_DIR})
|
||||||
|
@ -7,11 +5,16 @@ file(COPY "test.epub3" DESTINATION ${CMAKE_CURRENT_BINARY_DIR})
|
||||||
|
|
||||||
find_package(Catch2 CONFIG)
|
find_package(Catch2 CONFIG)
|
||||||
|
|
||||||
if(Catch2_FOUND) # Catch 2.x
|
if(Catch2_FOUND) # Catch 2.x / 3.x
|
||||||
include(Catch)
|
include(Catch)
|
||||||
add_executable(all_tests main.cpp ${sources_tests})
|
add_executable(all_tests main.cpp ${sources_tests})
|
||||||
target_link_libraries(all_tests
|
if(TARGET Catch2::Catch2WithMain) # Catch 3.x
|
||||||
PRIVATE Catch2::Catch2 ${PROJECT_NAME}_lib)
|
target_link_libraries(all_tests
|
||||||
|
PRIVATE Catch2::Catch2WithMain ${PROJECT_NAME}_lib)
|
||||||
|
else() # Catch 2.x
|
||||||
|
target_link_libraries(all_tests
|
||||||
|
PRIVATE Catch2::Catch2 ${PROJECT_NAME}_lib)
|
||||||
|
endif()
|
||||||
target_include_directories(all_tests PRIVATE "/usr/include/catch2")
|
target_include_directories(all_tests PRIVATE "/usr/include/catch2")
|
||||||
catch_discover_tests(all_tests EXTRA_ARGS "${EXTRA_TEST_ARGS}")
|
catch_discover_tests(all_tests EXTRA_ARGS "${EXTRA_TEST_ARGS}")
|
||||||
else() # Catch 1.x
|
else() # Catch 1.x
|
||||||
|
|
|
@ -1,3 +1,8 @@
|
||||||
#define CATCH_CONFIG_MAIN
|
#define CATCH_CONFIG_MAIN
|
||||||
|
|
||||||
#include <catch.hpp>
|
// catch 3 does not have catch.hpp anymore
|
||||||
|
#if __has_include(<catch.hpp>)
|
||||||
|
# include <catch.hpp>
|
||||||
|
#else
|
||||||
|
# include <catch_all.hpp>
|
||||||
|
#endif
|
||||||
|
|
|
@ -1,7 +1,12 @@
|
||||||
#include "fs-compat.hpp"
|
#include "fs-compat.hpp"
|
||||||
#include "helpers.hpp"
|
#include "helpers.hpp"
|
||||||
|
|
||||||
#include <catch.hpp>
|
// catch 3 does not have catch.hpp anymore
|
||||||
|
#if __has_include(<catch.hpp>)
|
||||||
|
# include <catch.hpp>
|
||||||
|
#else
|
||||||
|
# include <catch_all.hpp>
|
||||||
|
#endif
|
||||||
|
|
||||||
#include <array>
|
#include <array>
|
||||||
#include <exception>
|
#include <exception>
|
||||||
|
|
|
@ -2,7 +2,12 @@
|
||||||
#include "options.hpp"
|
#include "options.hpp"
|
||||||
#include "search.hpp"
|
#include "search.hpp"
|
||||||
|
|
||||||
#include <catch.hpp>
|
// catch 3 does not have catch.hpp anymore
|
||||||
|
#if __has_include(<catch.hpp>)
|
||||||
|
# include <catch.hpp>
|
||||||
|
#else
|
||||||
|
# include <catch_all.hpp>
|
||||||
|
#endif
|
||||||
|
|
||||||
#include <clocale>
|
#include <clocale>
|
||||||
#include <exception>
|
#include <exception>
|
||||||
|
@ -53,7 +58,7 @@ SCENARIO("Searching EPUB files works")
|
||||||
{
|
{
|
||||||
try
|
try
|
||||||
{
|
{
|
||||||
opts.raw = 1;
|
opts.raw = true;
|
||||||
opts.context = 1;
|
opts.context = 1;
|
||||||
matches = epubgrep::search::search(epubfile, "href", opts);
|
matches = epubgrep::search::search(epubfile, "href", opts);
|
||||||
}
|
}
|
||||||
|
@ -88,8 +93,7 @@ SCENARIO("Searching EPUB files works")
|
||||||
GIVEN("Our test EPUB3 file")
|
GIVEN("Our test EPUB3 file")
|
||||||
{
|
{
|
||||||
fs::path epubfile{"test.epub3"};
|
fs::path epubfile{"test.epub3"};
|
||||||
std::setlocale(LC_CTYPE,
|
std::setlocale(LC_CTYPE, ""); // Needed for utf-8 support in libarchive.
|
||||||
""); // Needed for utf-8 support in libarchive.
|
|
||||||
bool exception{false};
|
bool exception{false};
|
||||||
|
|
||||||
REQUIRE(fs::exists(epubfile));
|
REQUIRE(fs::exists(epubfile));
|
||||||
|
@ -128,7 +132,7 @@ SCENARIO("Searching EPUB files works")
|
||||||
try
|
try
|
||||||
{
|
{
|
||||||
opts.raw = true;
|
opts.raw = true;
|
||||||
opts.context = true;
|
opts.context = 1;
|
||||||
matches = epubgrep::search::search(epubfile, "href", opts);
|
matches = epubgrep::search::search(epubfile, "href", opts);
|
||||||
}
|
}
|
||||||
catch (const std::exception &)
|
catch (const std::exception &)
|
||||||
|
@ -161,6 +165,32 @@ SCENARIO("Searching EPUB files works")
|
||||||
R"(media-type="application/xhtml+xml")");
|
R"(media-type="application/xhtml+xml")");
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
WHEN("We search for a phrase at the beginning of the file "
|
||||||
|
"and specify a very high context")
|
||||||
|
{
|
||||||
|
try
|
||||||
|
{
|
||||||
|
opts.context = 69069;
|
||||||
|
matches = epubgrep::search::search(epubfile, "Test for",
|
||||||
|
opts);
|
||||||
|
}
|
||||||
|
catch (const std::exception &)
|
||||||
|
{
|
||||||
|
exception = true;
|
||||||
|
}
|
||||||
|
|
||||||
|
THEN("No exception is thrown")
|
||||||
|
AND_THEN("It returns the match correctly")
|
||||||
|
{
|
||||||
|
REQUIRE_FALSE(exception);
|
||||||
|
REQUIRE(matches.at(0).filepath_inside == "start.xhtml");
|
||||||
|
REQUIRE(matches.at(0).text == "Test for");
|
||||||
|
REQUIRE(matches.at(0).headline.empty());
|
||||||
|
REQUIRE(matches.at(0).context.first.empty());
|
||||||
|
REQUIRE(*matches.at(0).context.second.rbegin() == '.');
|
||||||
|
}
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
|
@ -1,7 +1,13 @@
|
||||||
|
#include "book.hpp"
|
||||||
#include "fs-compat.hpp"
|
#include "fs-compat.hpp"
|
||||||
#include "search.hpp"
|
#include "search.hpp"
|
||||||
|
|
||||||
#include <catch.hpp>
|
// catch 3 does not have catch.hpp anymore
|
||||||
|
#if __has_include(<catch.hpp>)
|
||||||
|
# include <catch.hpp>
|
||||||
|
#else
|
||||||
|
# include <catch_all.hpp>
|
||||||
|
#endif
|
||||||
|
|
||||||
#include <clocale>
|
#include <clocale>
|
||||||
#include <exception>
|
#include <exception>
|
||||||
|
@ -26,7 +32,7 @@ SCENARIO("Searching helpers work as intended")
|
||||||
text = "Moss";
|
text = "Moss";
|
||||||
try
|
try
|
||||||
{
|
{
|
||||||
epubgrep::search::cleanup_text(text);
|
text = epubgrep::book::process_page(text).text_cleaned;
|
||||||
}
|
}
|
||||||
catch (const std::exception &)
|
catch (const std::exception &)
|
||||||
{
|
{
|
||||||
|
@ -46,7 +52,7 @@ SCENARIO("Searching helpers work as intended")
|
||||||
text = "💖\r\r🦝";
|
text = "💖\r\r🦝";
|
||||||
try
|
try
|
||||||
{
|
{
|
||||||
epubgrep::search::cleanup_text(text);
|
text = epubgrep::book::process_page(text).text_cleaned;
|
||||||
}
|
}
|
||||||
catch (const std::exception &)
|
catch (const std::exception &)
|
||||||
{
|
{
|
||||||
|
@ -54,7 +60,7 @@ SCENARIO("Searching helpers work as intended")
|
||||||
}
|
}
|
||||||
|
|
||||||
THEN("No exception is thrown")
|
THEN("No exception is thrown")
|
||||||
AND_THEN("The \\r are removed unchanged")
|
AND_THEN("The \\r are removed")
|
||||||
{
|
{
|
||||||
REQUIRE_FALSE(exception);
|
REQUIRE_FALSE(exception);
|
||||||
REQUIRE(text == "💖🦝");
|
REQUIRE(text == "💖🦝");
|
||||||
|
@ -66,7 +72,7 @@ SCENARIO("Searching helpers work as intended")
|
||||||
text = "Moss\n\n\n\n\n\nis good.";
|
text = "Moss\n\n\n\n\n\nis good.";
|
||||||
try
|
try
|
||||||
{
|
{
|
||||||
epubgrep::search::cleanup_text(text);
|
text = epubgrep::book::process_page(text).text_cleaned;
|
||||||
}
|
}
|
||||||
catch (const std::exception &)
|
catch (const std::exception &)
|
||||||
{
|
{
|
||||||
|
@ -91,8 +97,8 @@ SCENARIO("Searching helpers work as intended")
|
||||||
text = "… <h3>Soup</h3> …";
|
text = "… <h3>Soup</h3> …";
|
||||||
try
|
try
|
||||||
{
|
{
|
||||||
epubgrep::search::cleanup_text(text);
|
auto file{epubgrep::book::process_page(text)};
|
||||||
text = epubgrep::search::headline(text);
|
text = epubgrep::book::headline(file, text.size());
|
||||||
}
|
}
|
||||||
catch (const std::exception &)
|
catch (const std::exception &)
|
||||||
{
|
{
|
||||||
|
@ -113,8 +119,8 @@ SCENARIO("Searching helpers work as intended")
|
||||||
"road to nowhere</h2> …";
|
"road to nowhere</h2> …";
|
||||||
try
|
try
|
||||||
{
|
{
|
||||||
epubgrep::search::cleanup_text(text);
|
auto file{epubgrep::book::process_page(text)};
|
||||||
text = epubgrep::search::headline(text);
|
text = epubgrep::book::headline(file, text.size());
|
||||||
}
|
}
|
||||||
catch (const std::exception &)
|
catch (const std::exception &)
|
||||||
{
|
{
|
||||||
|
@ -134,8 +140,8 @@ SCENARIO("Searching helpers work as intended")
|
||||||
text = "<html><hr>The long<section>road to nowhere</section>";
|
text = "<html><hr>The long<section>road to nowhere</section>";
|
||||||
try
|
try
|
||||||
{
|
{
|
||||||
epubgrep::search::cleanup_text(text);
|
auto file{epubgrep::book::process_page(text)};
|
||||||
text = epubgrep::search::headline(text);
|
text = epubgrep::book::headline(file, text.size());
|
||||||
}
|
}
|
||||||
catch (const std::exception &)
|
catch (const std::exception &)
|
||||||
{
|
{
|
||||||
|
@ -160,8 +166,8 @@ SCENARIO("Searching helpers work as intended")
|
||||||
text = R"(… <span epub:type="pagebreak" … title="69"/> …)";
|
text = R"(… <span epub:type="pagebreak" … title="69"/> …)";
|
||||||
try
|
try
|
||||||
{
|
{
|
||||||
epubgrep::search::cleanup_text(text);
|
auto file{epubgrep::book::process_page(text)};
|
||||||
text = epubgrep::search::page(text);
|
text = epubgrep::book::page(file, text.size());
|
||||||
}
|
}
|
||||||
catch (const std::exception &)
|
catch (const std::exception &)
|
||||||
{
|
{
|
||||||
|
@ -181,8 +187,8 @@ SCENARIO("Searching helpers work as intended")
|
||||||
text = R"(… <span role="doc-pagebreak" … aria-label="69"/> …)";
|
text = R"(… <span role="doc-pagebreak" … aria-label="69"/> …)";
|
||||||
try
|
try
|
||||||
{
|
{
|
||||||
epubgrep::search::cleanup_text(text);
|
auto file{epubgrep::book::process_page(text)};
|
||||||
text = epubgrep::search::page(text);
|
text = epubgrep::book::page(file, text.size());
|
||||||
}
|
}
|
||||||
catch (const std::exception &)
|
catch (const std::exception &)
|
||||||
{
|
{
|
||||||
|
|
|
@ -2,10 +2,16 @@
|
||||||
#include "options.hpp"
|
#include "options.hpp"
|
||||||
#include "search.hpp"
|
#include "search.hpp"
|
||||||
|
|
||||||
#include <catch.hpp>
|
// catch 3 does not have catch.hpp anymore
|
||||||
|
#if __has_include(<catch.hpp>)
|
||||||
|
# include <catch.hpp>
|
||||||
|
#else
|
||||||
|
# include <catch_all.hpp>
|
||||||
|
#endif
|
||||||
|
|
||||||
#include <clocale>
|
#include <clocale>
|
||||||
#include <exception>
|
#include <exception>
|
||||||
|
#include <iostream>
|
||||||
#include <string>
|
#include <string>
|
||||||
#include <vector>
|
#include <vector>
|
||||||
|
|
||||||
|
@ -32,8 +38,9 @@ SCENARIO("Searching ZIP files works")
|
||||||
opts.regex = epubgrep::options::regex_kind::extended;
|
opts.regex = epubgrep::options::regex_kind::extended;
|
||||||
matches = epubgrep::search::search(zipfile, "📙+\\w?", opts);
|
matches = epubgrep::search::search(zipfile, "📙+\\w?", opts);
|
||||||
}
|
}
|
||||||
catch (const std::exception &)
|
catch (const std::exception &e)
|
||||||
{
|
{
|
||||||
|
std::cerr << "EXCEPTION: " << e.what() << '\n';
|
||||||
exception = true;
|
exception = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -53,8 +60,9 @@ SCENARIO("Searching ZIP files works")
|
||||||
opts.context = 1;
|
opts.context = 1;
|
||||||
matches = epubgrep::search::search(zipfile, "📗", opts);
|
matches = epubgrep::search::search(zipfile, "📗", opts);
|
||||||
}
|
}
|
||||||
catch (const std::exception &)
|
catch (const std::exception &e)
|
||||||
{
|
{
|
||||||
|
std::cerr << "EXCEPTION: " << e.what() << '\n';
|
||||||
exception = true;
|
exception = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -78,8 +86,9 @@ SCENARIO("Searching ZIP files works")
|
||||||
matches = epubgrep::search::search(zipfile, R"([ \n])",
|
matches = epubgrep::search::search(zipfile, R"([ \n])",
|
||||||
opts);
|
opts);
|
||||||
}
|
}
|
||||||
catch (const std::exception &)
|
catch (const std::exception &e)
|
||||||
{
|
{
|
||||||
|
std::cerr << "EXCEPTION: " << e.what() << '\n';
|
||||||
exception = true;
|
exception = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -114,12 +123,13 @@ SCENARIO("Searching ZIP files works")
|
||||||
try
|
try
|
||||||
{
|
{
|
||||||
opts.context = 1;
|
opts.context = 1;
|
||||||
opts.regex = epubgrep::options::regex_kind::extended;
|
opts.regex = epubgrep::options::regex_kind::perl;
|
||||||
matches = epubgrep::search::search(
|
matches = epubgrep::search::search(
|
||||||
zipfile, R"(work\s[\w]+\.\W[\w']+\Wstay)", opts);
|
zipfile, R"(work\s[\w]+\.\W[\w']+\Wstay)", opts);
|
||||||
}
|
}
|
||||||
catch (const std::exception &)
|
catch (const std::exception &e)
|
||||||
{
|
{
|
||||||
|
std::cerr << "EXCEPTION: " << e.what() << '\n';
|
||||||
exception = true;
|
exception = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
@ -1,7 +1,12 @@
|
||||||
#include "fs-compat.hpp"
|
#include "fs-compat.hpp"
|
||||||
#include "zip.hpp"
|
#include "zip.hpp"
|
||||||
|
|
||||||
#include <catch.hpp>
|
// catch 3 does not have catch.hpp anymore
|
||||||
|
#if __has_include(<catch.hpp>)
|
||||||
|
# include <catch.hpp>
|
||||||
|
#else
|
||||||
|
# include <catch_all.hpp>
|
||||||
|
#endif
|
||||||
|
|
||||||
#include <clocale>
|
#include <clocale>
|
||||||
#include <exception>
|
#include <exception>
|
||||||
|
|
|
@ -1,22 +1,28 @@
|
||||||
msgid ""
|
msgid ""
|
||||||
msgstr ""
|
msgstr ""
|
||||||
"Project-Id-Version: epubgrep 0.5.0\n"
|
"Project-Id-Version: epubgrep 0.6.0\n"
|
||||||
"Report-Msgid-Bugs-To: \n"
|
"Report-Msgid-Bugs-To: \n"
|
||||||
"POT-Creation-Date: 2021-06-02 09:11+0200\n"
|
"POT-Creation-Date: 2021-08-20 17:06+0200\n"
|
||||||
"PO-Revision-Date: 2021-06-02 09:12+0200\n"
|
"PO-Revision-Date: 2021-08-20 17:07+0200\n"
|
||||||
"Last-Translator: tastytea <tastytea@tastytea.de>\n"
|
"Last-Translator: tastytea <tastytea@tastytea.de>\n"
|
||||||
"Language-Team: tastytea <https://schlomp.space/tastytea/epubgrep>\n"
|
"Language-Team: tastytea <https://schlomp.space/tastytea/epubgrep>\n"
|
||||||
"Language: de\n"
|
"Language: de\n"
|
||||||
"MIME-Version: 1.0\n"
|
"MIME-Version: 1.0\n"
|
||||||
"Content-Type: text/plain; charset=UTF-8\n"
|
"Content-Type: text/plain; charset=UTF-8\n"
|
||||||
"Content-Transfer-Encoding: 8bit\n"
|
"Content-Transfer-Encoding: 8bit\n"
|
||||||
"X-Generator: Poedit 2.4.3\n"
|
"X-Generator: Poedit 3.0\n"
|
||||||
"X-Poedit-Basepath: ..\n"
|
"X-Poedit-Basepath: ..\n"
|
||||||
"Plural-Forms: nplurals=2; plural=(n != 1);\n"
|
"Plural-Forms: nplurals=2; plural=(n != 1);\n"
|
||||||
"X-Poedit-SourceCharset: UTF-8\n"
|
"X-Poedit-SourceCharset: UTF-8\n"
|
||||||
"X-Poedit-KeywordsList: translate\n"
|
"X-Poedit-KeywordsList: translate\n"
|
||||||
"X-Poedit-SearchPath-0: .\n"
|
"X-Poedit-SearchPath-0: .\n"
|
||||||
|
|
||||||
|
# „Spine“ ist ein Fachbegriff, daher habe ich ihn nicht übersetzt.
|
||||||
|
#: src/book.cpp:284
|
||||||
|
msgid "{0:s} is damaged. Could not read spine. Skipping file.\n"
|
||||||
|
msgstr ""
|
||||||
|
"{0:s} ist beschädigt. Konnte „Spine“ nicht lesen. Überspringe Datei.\n"
|
||||||
|
|
||||||
#: src/log.cpp:70
|
#: src/log.cpp:70
|
||||||
msgid "WARNING"
|
msgid "WARNING"
|
||||||
msgstr "WARNUNG"
|
msgstr "WARNUNG"
|
||||||
|
@ -29,21 +35,29 @@ msgstr "FEHLER"
|
||||||
msgid "FATAL ERROR"
|
msgid "FATAL ERROR"
|
||||||
msgstr "SCHWERER FEHLER"
|
msgstr "SCHWERER FEHLER"
|
||||||
|
|
||||||
#: src/main.cpp:79
|
#: src/main.cpp:83
|
||||||
msgid " (while parsing options)"
|
msgid " (while parsing options)"
|
||||||
msgstr " (während Optionen interpretiert wurden)"
|
msgstr " (während Optionen interpretiert wurden)"
|
||||||
|
|
||||||
#: src/main.cpp:125
|
#: src/main.cpp:129
|
||||||
msgid "Could not open {0:s}: {1:s}"
|
msgid "Could not open {0:s}: {1:s}"
|
||||||
msgstr "Konnte {0:s} nicht öffnen: {1:s}"
|
msgstr "Konnte {0:s} nicht öffnen: {1:s}"
|
||||||
|
|
||||||
#: src/main.cpp:174
|
#: src/main.cpp:179
|
||||||
msgid " (while opening {0:s})"
|
msgid " (while opening {0:s})"
|
||||||
msgstr " (während {0:s} durchsucht wurde)"
|
msgstr " (während {0:s} durchsucht wurde)"
|
||||||
|
|
||||||
#: src/options.cpp:52
|
#: src/main.cpp:237
|
||||||
msgid "Available options"
|
msgid "{0:d} of {1:d} books searched."
|
||||||
msgstr "Verfügbare Optionen"
|
msgstr "{0:d} von {1:d} Büchern durchsucht."
|
||||||
|
|
||||||
|
#: src/main.cpp:241
|
||||||
|
msgid "All books searched."
|
||||||
|
msgstr "Alle Bücher durchsucht."
|
||||||
|
|
||||||
|
#: src/options.cpp:53
|
||||||
|
msgid "General options"
|
||||||
|
msgstr "Allgemeine Optionen"
|
||||||
|
|
||||||
#: src/options.cpp:56
|
#: src/options.cpp:56
|
||||||
msgid "Display this help and exit."
|
msgid "Display this help and exit."
|
||||||
|
@ -54,55 +68,76 @@ msgid "Display version information and exit."
|
||||||
msgstr "Versionsinformationen ausgeben und beenden."
|
msgstr "Versionsinformationen ausgeben und beenden."
|
||||||
|
|
||||||
#: src/options.cpp:60
|
#: src/options.cpp:60
|
||||||
|
msgid "Enable debug output."
|
||||||
|
msgstr "Debug-Ausgabe einschalten."
|
||||||
|
|
||||||
|
#: src/options.cpp:63
|
||||||
|
msgid "Search options"
|
||||||
|
msgstr "Suchoptionen"
|
||||||
|
|
||||||
|
#: src/options.cpp:66
|
||||||
msgid "PATTERN is a basic regular expression (default)."
|
msgid "PATTERN is a basic regular expression (default)."
|
||||||
msgstr "MUSTER ist eine „basic regular expression“ (standard)."
|
msgstr "MUSTER ist eine „basic regular expression“ (standard)."
|
||||||
|
|
||||||
#: src/options.cpp:63
|
#: src/options.cpp:69
|
||||||
msgid "PATTERN is an extended regular expression."
|
msgid "PATTERN is an extended regular expression."
|
||||||
msgstr "MUSTER ist eine „extended regular expression“."
|
msgstr "MUSTER ist eine „extended regular expression“."
|
||||||
|
|
||||||
#: src/options.cpp:65
|
#: src/options.cpp:71
|
||||||
msgid "Use grep-variation of regular expressions with -G and -E."
|
msgid "Use grep-variation of regular expressions with -G and -E."
|
||||||
msgstr "Benutze grep-Variante von regulären Ausdrücken mit -G und -E."
|
msgstr "Benutze grep-Variante von regulären Ausdrücken mit -G und -E."
|
||||||
|
|
||||||
#: src/options.cpp:68
|
#: src/options.cpp:74
|
||||||
msgid "PATTERN is a Perl regular expression."
|
msgid "PATTERN is a Perl regular expression."
|
||||||
msgstr "MUSTER ist ein regulärer Ausdruck, wie Perl ihn akzeptiert."
|
msgstr "MUSTER ist ein regulärer Ausdruck, wie Perl ihn akzeptiert."
|
||||||
|
|
||||||
#: src/options.cpp:70
|
#: src/options.cpp:77
|
||||||
msgid "Ignore case distinctions in pattern and data."
|
msgid "Ignore case distinctions in pattern and data."
|
||||||
msgstr "Unterschied zwischen Groß- und Kleinschreibung ignorieren."
|
msgstr "Unterschied zwischen Groß- und Kleinschreibung ignorieren."
|
||||||
|
|
||||||
#: src/options.cpp:73
|
#: src/options.cpp:80
|
||||||
msgid "PATTERN"
|
|
||||||
msgstr "MUSTER"
|
|
||||||
|
|
||||||
#: src/options.cpp:74
|
|
||||||
msgid "Use additional PATTERN for matching."
|
|
||||||
msgstr "Benutze zusätzliches MUSTER zum Abgleich."
|
|
||||||
|
|
||||||
#: src/options.cpp:76
|
|
||||||
msgid "Do not clean up text before searching."
|
msgid "Do not clean up text before searching."
|
||||||
msgstr "Nicht den Text vor dem suchen säubern."
|
msgstr "Nicht den Text vor dem suchen säubern."
|
||||||
|
|
||||||
#: src/options.cpp:78
|
#: src/options.cpp:82
|
||||||
|
msgid "Read all files under each directory, recursively."
|
||||||
|
msgstr "Lies rekursiv alle Dateien unter jedem Verzeichnis."
|
||||||
|
|
||||||
|
#: src/options.cpp:85
|
||||||
|
msgid "Read all files under each directory, recursively, following symlinks."
|
||||||
|
msgstr ""
|
||||||
|
"Lies rekursiv alle Dateien unter jedem Verzeichnis und folge dabei symlinks."
|
||||||
|
|
||||||
|
#: src/options.cpp:88
|
||||||
|
msgid "PATTERN"
|
||||||
|
msgstr "MUSTER"
|
||||||
|
|
||||||
|
#: src/options.cpp:89
|
||||||
|
msgid "Use additional PATTERN for matching."
|
||||||
|
msgstr "Benutze zusätzliches MUSTER zum Abgleich."
|
||||||
|
|
||||||
|
#: src/options.cpp:92
|
||||||
|
msgid "Output options"
|
||||||
|
msgstr "Ausgabeoptionen"
|
||||||
|
|
||||||
|
#: src/options.cpp:95 src/options.cpp:113
|
||||||
msgid "NUMBER"
|
msgid "NUMBER"
|
||||||
msgstr "ANZAHL"
|
msgstr "ANZAHL"
|
||||||
|
|
||||||
#: src/options.cpp:79
|
#: src/options.cpp:96
|
||||||
msgid "Print NUMBER words of context around matches."
|
msgid "Print NUMBER words of context around matches."
|
||||||
msgstr "ANZAHL Wörter an Kontext um die Treffer herum ausgeben."
|
msgstr "ANZAHL Wörter an Kontext um die Treffer herum ausgeben."
|
||||||
|
|
||||||
#: src/options.cpp:81
|
#: src/options.cpp:98
|
||||||
msgid "Turn off colors and other decorations."
|
msgid "Turn off colors and other decorations."
|
||||||
msgstr "Schalte Farben und andere Dekorationen aus."
|
msgstr "Schalte Farben und andere Dekorationen aus."
|
||||||
|
|
||||||
# Bezieht sich auf --no-filename.
|
# Bezieht sich auf --no-filename.
|
||||||
#: src/options.cpp:83
|
#: src/options.cpp:100
|
||||||
msgid "WHICH"
|
msgid "WHICH"
|
||||||
msgstr "WELCHE"
|
msgstr "WELCHE"
|
||||||
|
|
||||||
#: src/options.cpp:84
|
#: src/options.cpp:101
|
||||||
msgid ""
|
msgid ""
|
||||||
"Suppress the mentioning of file names on output. WHICH is ‘filesystem’, ‘in-"
|
"Suppress the mentioning of file names on output. WHICH is ‘filesystem’, ‘in-"
|
||||||
"epub’ or ‘all’."
|
"epub’ or ‘all’."
|
||||||
|
@ -110,32 +145,31 @@ msgstr ""
|
||||||
"Unterdrücke die Erwähnung der Dateinamens in der Ausgabe. WELCHE kann "
|
"Unterdrücke die Erwähnung der Dateinamens in der Ausgabe. WELCHE kann "
|
||||||
"‚filesystem‘, ‚in-epub‘ oder ‚all‘ sein."
|
"‚filesystem‘, ‚in-epub‘ oder ‚all‘ sein."
|
||||||
|
|
||||||
#: src/options.cpp:87
|
#: src/options.cpp:104
|
||||||
msgid "Read all files under each directory, recursively."
|
|
||||||
msgstr "Lies rekursiv alle Dateien unter jedem Verzeichnis."
|
|
||||||
|
|
||||||
#: src/options.cpp:90
|
|
||||||
msgid "Read all files under each directory, recursively, following symlinks."
|
|
||||||
msgstr ""
|
|
||||||
"Lies rekursiv alle Dateien unter jedem Verzeichnis und folge dabei symlinks."
|
|
||||||
|
|
||||||
#: src/options.cpp:93
|
|
||||||
msgid "Ignore errors about wrong file formats."
|
msgid "Ignore errors about wrong file formats."
|
||||||
msgstr "Ignoriere Fehlermeldungen wegen des falschen Dateiformats."
|
msgstr "Ignoriere Fehlermeldungen wegen des falschen Dateiformats."
|
||||||
|
|
||||||
#: src/options.cpp:95
|
#: src/options.cpp:106
|
||||||
msgid "Enable debug output."
|
|
||||||
msgstr "Debug-Ausgabe einschalten."
|
|
||||||
|
|
||||||
#: src/options.cpp:97
|
|
||||||
msgid "Output JSON instead of plain text."
|
msgid "Output JSON instead of plain text."
|
||||||
msgstr "Gib JSON statt Klartext aus."
|
msgstr "Gib JSON statt Klartext aus."
|
||||||
|
|
||||||
#: src/options.cpp:138
|
#: src/options.cpp:108
|
||||||
msgid "Usage: epubgrep [OPTION]… PATTERN [FILE]…\n"
|
msgid "Output HTML instead of plain text."
|
||||||
msgstr "Aufruf: epubgrep [OPTION]… MUSTER [DATEI]…\n"
|
msgstr "Gib HTML statt Klartext aus."
|
||||||
|
|
||||||
#: src/options.cpp:140
|
#: src/options.cpp:110
|
||||||
|
msgid "Output status message every STATUS-INTERVAL seconds."
|
||||||
|
msgstr "Gib alle STATUS-INTERVAL Sekunden eine Statusmeldung aus."
|
||||||
|
|
||||||
|
#: src/options.cpp:114
|
||||||
|
msgid "Set status message interval to NUMBER seconds."
|
||||||
|
msgstr "Setze Intervall für Statusmeldungen auf ANZAHL Sekunden."
|
||||||
|
|
||||||
|
#: src/options.cpp:162
|
||||||
|
msgid "Usage: epubgrep [OPTION]… PATTERN FILE…\n"
|
||||||
|
msgstr "Aufruf: epubgrep [OPTION]… MUSTER DATEI…\n"
|
||||||
|
|
||||||
|
#: src/options.cpp:164
|
||||||
msgid ""
|
msgid ""
|
||||||
"\n"
|
"\n"
|
||||||
"You can access the full manual with `man epubgrep`.\n"
|
"You can access the full manual with `man epubgrep`.\n"
|
||||||
|
@ -143,7 +177,7 @@ msgstr ""
|
||||||
"\n"
|
"\n"
|
||||||
"Du kannst mit `man epubgrep` auf das vollständige Handbuch zugreifen.\n"
|
"Du kannst mit `man epubgrep` auf das vollständige Handbuch zugreifen.\n"
|
||||||
|
|
||||||
#: src/options.cpp:147
|
#: src/options.cpp:171
|
||||||
msgid ""
|
msgid ""
|
||||||
"Copyright © 2021 tastytea <tastytea@tastytea.de>\n"
|
"Copyright © 2021 tastytea <tastytea@tastytea.de>\n"
|
||||||
"License AGPL-3.0-only <https://gnu.org/licenses/agpl.html>.\n"
|
"License AGPL-3.0-only <https://gnu.org/licenses/agpl.html>.\n"
|
||||||
|
@ -155,32 +189,51 @@ msgstr ""
|
||||||
"Für dieses Programm besteht KEINERLEI GARANTIE. Dies ist freie Software,\n"
|
"Für dieses Programm besteht KEINERLEI GARANTIE. Dies ist freie Software,\n"
|
||||||
"die Sie unter bestimmten Bedingungen weitergeben dürfen.\n"
|
"die Sie unter bestimmten Bedingungen weitergeben dürfen.\n"
|
||||||
|
|
||||||
#: src/output.cpp:51
|
#: src/output.cpp:47
|
||||||
msgid " In {0:s}: \n"
|
msgid " In {0:s}: \n"
|
||||||
msgstr " In {0:s}:\n"
|
msgstr " In {0:s}:\n"
|
||||||
|
|
||||||
#: src/zip.cpp:56 src/zip.cpp:84
|
# Sprache der Benutzeroberfläche.
|
||||||
|
#: src/output.cpp:145
|
||||||
|
msgid "en"
|
||||||
|
msgstr "de"
|
||||||
|
|
||||||
|
#: src/output.cpp:157
|
||||||
|
msgid "File {0:d}"
|
||||||
|
msgstr "Datei {0:d}"
|
||||||
|
|
||||||
|
#: src/output.cpp:172
|
||||||
|
msgid "File path (in EPUB file)"
|
||||||
|
msgstr "Dateipfad (innerhalb der EPUB Datei)"
|
||||||
|
|
||||||
|
#: src/output.cpp:176
|
||||||
|
msgid "Last headline"
|
||||||
|
msgstr "Letzte Überschrift"
|
||||||
|
|
||||||
|
#: src/output.cpp:179
|
||||||
|
msgid "Page number"
|
||||||
|
msgstr "Seitennummer"
|
||||||
|
|
||||||
|
#: src/output.cpp:182
|
||||||
|
msgid "Match"
|
||||||
|
msgstr "Treffer"
|
||||||
|
|
||||||
|
#: src/zip.cpp:55 src/zip.cpp:83
|
||||||
msgid "File in {0:s} is damaged. Skipping in-EPUB file.\n"
|
msgid "File in {0:s} is damaged. Skipping in-EPUB file.\n"
|
||||||
msgstr "Datei in {0:s} ist beschädigt. Überspringe Datei in der EPUB.\n"
|
msgstr "Datei in {0:s} ist beschädigt. Überspringe Datei in der EPUB.\n"
|
||||||
|
|
||||||
#: src/zip.cpp:104
|
#: src/zip.cpp:103
|
||||||
msgid "Could not read {0:s} in {1:s}."
|
msgid "Could not read {0:s} in {1:s}."
|
||||||
msgstr "Konnte {0:s} in {1:s} nicht lesen."
|
msgstr "Konnte {0:s} in {1:s} nicht lesen."
|
||||||
|
|
||||||
#: src/zip.cpp:119 src/zip.cpp:126
|
#: src/zip.cpp:118 src/zip.cpp:125
|
||||||
msgid "{0:s} not found in {1:s}."
|
msgid "{0:s} not found in {1:s}."
|
||||||
msgstr "{0:s} nicht gefunden in {1:s}."
|
msgstr "{0:s} nicht gefunden in {1:s}."
|
||||||
|
|
||||||
#: src/zip.cpp:149
|
#: src/zip.cpp:148
|
||||||
msgid "Could not open {0:s}."
|
msgid "Could not open {0:s}."
|
||||||
msgstr "Konnte {0:s} nicht öffnen."
|
msgstr "Konnte {0:s} nicht öffnen."
|
||||||
|
|
||||||
#: src/zip.cpp:163
|
#: src/zip.cpp:162
|
||||||
msgid "Could not close {0:s}."
|
msgid "Could not close {0:s}."
|
||||||
msgstr "Konnte {0:s} nicht schließen."
|
msgstr "Konnte {0:s} nicht schließen."
|
||||||
|
|
||||||
# „Spine“ ist ein Fachbegriff, daher habe ich ihn nicht übersetzt.
|
|
||||||
#: src/zip.cpp:232
|
|
||||||
msgid "{0:s} is damaged. Could not read spine. Skipping file.\n"
|
|
||||||
msgstr ""
|
|
||||||
"{0:s} ist beschädigt. Konnte „Spine“ nicht lesen. Überspringe Datei.\n"
|
|
||||||
|
|
Loading…
Reference in New Issue