google_play.py 3.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117
  1. # SPDX-License-Identifier: AGPL-3.0-or-later
  2. # lint: pylint
  3. """Google Play Apps & Google Play Movies
  4. """
  5. from urllib.parse import urlencode
  6. from lxml import html
  7. from searx.utils import (
  8. eval_xpath,
  9. extract_url,
  10. extract_text,
  11. eval_xpath_list,
  12. eval_xpath_getindex,
  13. )
  14. about = {
  15. "website": "https://play.google.com/",
  16. "wikidata_id": "Q79576",
  17. "use_official_api": False,
  18. "require_api_key": False,
  19. "results": "HTML",
  20. }
  21. send_accept_language_header = True
  22. play_categ = None # apps|movies
  23. base_url = 'https://play.google.com'
  24. search_url = base_url + "/store/search?{query}&c={play_categ}"
  25. def request(query, params):
  26. if play_categ not in ('movies', 'apps'):
  27. raise ValueError(f"unknown google play category: {play_categ}")
  28. params["url"] = search_url.format(
  29. query=urlencode({"q": query}),
  30. play_categ=play_categ,
  31. )
  32. params['cookies']['CONSENT'] = "YES+"
  33. return params
  34. def response(resp):
  35. if play_categ == 'movies':
  36. return response_movies(resp)
  37. if play_categ == 'apps':
  38. return response_apps(resp)
  39. raise ValueError(f"Unsupported play category: {play_categ}")
  40. def response_movies(resp):
  41. results = []
  42. dom = html.fromstring(resp.text)
  43. for section in eval_xpath(dom, '//c-wiz/section/header/..'):
  44. sec_name = extract_text(eval_xpath(section, './header'))
  45. for item in eval_xpath(section, './/a'):
  46. url = base_url + item.get('href')
  47. div_1, div_2 = eval_xpath(item, './div')[:2]
  48. title = extract_text(eval_xpath(div_2, './div[@title]'))
  49. metadata = extract_text(eval_xpath(div_2, './div[@class]'))
  50. img = eval_xpath(div_1, './/img')[0]
  51. img_src = img.get('src')
  52. results.append(
  53. {
  54. "url": url,
  55. "title": title,
  56. "content": sec_name,
  57. "img_src": img_src,
  58. 'metadata': metadata,
  59. 'template': 'videos.html',
  60. }
  61. )
  62. return results
  63. def response_apps(resp):
  64. results = []
  65. dom = html.fromstring(resp.text)
  66. if eval_xpath(dom, '//div[@class="v6DsQb"]'):
  67. return []
  68. spot = eval_xpath_getindex(dom, '//div[@class="ipRz4"]', 0, None)
  69. if spot is not None:
  70. url = extract_url(eval_xpath(spot, './a[@class="Qfxief"]/@href'), search_url)
  71. title = extract_text(eval_xpath(spot, './/div[@class="vWM94c"]'))
  72. content = extract_text(eval_xpath(spot, './/div[@class="LbQbAe"]'))
  73. img = extract_text(eval_xpath(spot, './/img[@class="T75of bzqKMd"]/@src'))
  74. results.append({"url": url, "title": title, "content": content, "img_src": img})
  75. more = eval_xpath_list(dom, '//c-wiz[@jsrenderer="RBsfwb"]//div[@role="listitem"]', min_len=1)
  76. for result in more:
  77. url = extract_url(eval_xpath(result, ".//a/@href"), search_url)
  78. title = extract_text(eval_xpath(result, './/span[@class="DdYX5"]'))
  79. content = extract_text(eval_xpath(result, './/span[@class="wMUdtb"]'))
  80. img = extract_text(
  81. eval_xpath(
  82. result,
  83. './/img[@class="T75of stzEZd" or @class="T75of etjhNc Q8CSx "]/@src',
  84. )
  85. )
  86. results.append({"url": url, "title": title, "content": content, "img_src": img})
  87. for suggestion in eval_xpath_list(dom, '//c-wiz[@jsrenderer="qyd4Kb"]//div[@class="ULeU3b neq64b"]'):
  88. results.append({"suggestion": extract_text(eval_xpath(suggestion, './/div[@class="Epkrse "]'))})
  89. return results