Merge bd773db956 into b07c0ae39f

[fix] annas archive: crash when no thumbnail, differing results, paging
[upd] pypi: Bump selenium from 4.25.0 to 4.26.1
2024-11-01 14:37:50 +01:00 · 2024-11-01 12:49:33 +01:00 · 2024-11-01 10:07:59 +00:00 · 2024-11-01 10:14:57 +01:00
3 changed files with 17 additions and 16 deletions
--- a/.github/workflows/integration.yml
+++ b/.github/workflows/integration.yml
@@ -45,14 +45,6 @@ jobs:
        make V=1 gecko.driver
    - name: Run tests
      run: make V=1 ci.test
-    - name: Test coverage
-      run: make V=1 test.coverage
-    - name: Store coverage result
-      uses: actions/upload-artifact@v3
-      with:
-        name: coverage-${{ matrix.python-version }}
-        path: coverage/
-        retention-days: 60

  themes:
    name: Themes
--- a/requirements-dev.txt
+++ b/requirements-dev.txt
@@ -4,7 +4,7 @@ cov-core==1.15.0
 black==24.3.0
 pylint==3.3.1
 splinter==0.21.0
-selenium==4.25.0
+selenium==4.26.1
 Pallets-Sphinx-Themes==2.3.0
 Sphinx==7.4.7
 sphinx-issues==5.0.0
--- a/searx/engines/annas_archive.py
+++ b/searx/engines/annas_archive.py
@@ -34,10 +34,10 @@ Implementations
 """

 from typing import List, Dict, Any, Optional
-from urllib.parse import quote
+from urllib.parse import urlencode
 from lxml import html

-from searx.utils import extract_text, eval_xpath, eval_xpath_list
+from searx.utils import extract_text, eval_xpath, eval_xpath_getindex, eval_xpath_list
 from searx.enginelib.traits import EngineTraits
 from searx.data import ENGINE_TRAITS

@@ -53,7 +53,7 @@ about: Dict[str, Any] = {

 # engine dependent config
 categories: List[str] = ["files"]
-paging: bool = False
+paging: bool = True

 # search-url
 base_url: str = "https://annas-archive.org"
@@ -99,9 +99,18 @@ def init(engine_settings=None):  # pylint: disable=unused-argument


 def request(query, params: Dict[str, Any]) -> Dict[str, Any]:
-    q = quote(query)
    lang = traits.get_language(params["language"], traits.all_locale)  # type: ignore
-    params["url"] = base_url + f"/search?lang={lang or ''}&content={aa_content}&ext={aa_ext}&sort={aa_sort}&q={q}"
+    args = {
+        'lang': lang,
+        'content': aa_content,
+        'ext': aa_ext,
+        'sort': aa_sort,
+        'q': query,
+        'page': params['pageno'],
+    }
+    # filter out None and empty values
+    filtered_args = dict((k, v) for k, v in args.items() if v)
+    params["url"] = f"{base_url}/search?{urlencode(filtered_args)}"
    return params


@@ -128,12 +137,12 @@ def response(resp) -> List[Dict[str, Optional[str]]]:
 def _get_result(item):
    return {
        'template': 'paper.html',
-        'url': base_url + item.xpath('./@href')[0],
+        'url': base_url + extract_text(eval_xpath_getindex(item, './@href', 0)),
        'title': extract_text(eval_xpath(item, './/h3/text()[1]')),
        'publisher': extract_text(eval_xpath(item, './/div[contains(@class, "text-sm")]')),
        'authors': [extract_text(eval_xpath(item, './/div[contains(@class, "italic")]'))],
        'content': extract_text(eval_xpath(item, './/div[contains(@class, "text-xs")]')),
-        'thumbnail': item.xpath('.//img/@src')[0],
+        'thumbnail': extract_text(eval_xpath_getindex(item, './/img/@src', 0, default=None), allow_none=True),
    }
Author	SHA1	Message	Date
dependabot[bot]	dd40c6d610	Merge `bd773db956` into `b07c0ae39f`	2024-11-01 14:37:50 +01:00
Bnyro	b07c0ae39f	[fix] annas archive: crash when no thumbnail, differing results, paging	2024-11-01 12:49:33 +01:00
dependabot[bot]	bd773db956	[upd] pypi: Bump selenium from 4.25.0 to 4.26.1 Bumps [selenium](https://github.com/SeleniumHQ/Selenium) from 4.25.0 to 4.26.1. - [Release notes](https://github.com/SeleniumHQ/Selenium/releases) - [Commits](https://github.com/SeleniumHQ/Selenium/commits) --- updated-dependencies: - dependency-name: selenium dependency-type: direct:development update-type: version-update:semver-minor ... Signed-off-by: dependabot[bot] <support@github.com>	2024-11-01 10:07:59 +00:00
Markus Heiser	56e3d72a76	[fix] CI: remove target test.coverage from python's test matrix The test.coverage cause a lot of failed CI jobs for reasons that cannot be explained. As we do not monitor the coverage anyway, it is superfluous to run this job, especially as it only has a disruptive effect on the CI. BTW and the CI action upload-artifact@v3 is deprecated [1] [1] https://github.com/actions/upload-artifact?tab=readme-ov-file#actionsupload-artifact Related: https://github.com/searxng/searxng/issues/3983 Signed-off-by: Markus Heiser <markus.heiser@darmarit.de>	2024-11-01 10:14:57 +01:00