regexes.py 6.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164
  1. # vim:set et sw=4:
  2. """
  3. Central repository of regexes for dak
  4. @contact: Debian FTP Master <ftpmaster@debian.org>
  5. @copyright: 2001, 2002, 2003, 2004, 2005, 2006 James Troup <james@nocrew.org>
  6. @copyright: 2009 Mark Hymers <mhy@debian.org>
  7. @copyright: 2009, 2010 Joerg Jaspert <joerg@debian.org>
  8. @license: GNU General Public License version 2 or later
  9. """
  10. # This program is free software; you can redistribute it and/or modify
  11. # it under the terms of the GNU General Public License as published by
  12. # the Free Software Foundation; either version 2 of the License, or
  13. # (at your option) any later version.
  14. # This program is distributed in the hope that it will be useful,
  15. # but WITHOUT ANY WARRANTY; without even the implied warranty of
  16. # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  17. # GNU General Public License for more details.
  18. # You should have received a copy of the GNU General Public License
  19. # along with this program; if not, write to the Free Software
  20. # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
  21. ###############################################################################
  22. import re
  23. #: Is it a number?
  24. re_isanum = re.compile(r"^\d+$")
  25. #: Looking for the default reply
  26. re_default_answer = re.compile(r"\[(.*)\]")
  27. #: Detect a binnmu
  28. re_bin_only_nmu = re.compile(r"\+b\d+$")
  29. #: To sort out comment lines
  30. re_comments = re.compile(r"\#.*")
  31. #: To ignore comment and whitespace lines.
  32. re_whitespace_comment = re.compile(r"^\s*(#|$)")
  33. re_no_epoch = re.compile(r"^\d+\:")
  34. re_extract_src_version = re.compile(r"(\S+)\s*\((.*)\)")
  35. re_isadeb = re.compile(r"(.+?)_(.+?)_(.+)\.u?deb$")
  36. orig_source_ext_re = r"orig(?:-[a-zA-Z0-9-]+)?\.tar\.(?:gz|bz2|xz)(?:\.asc)?"
  37. file_source_ext_re = "(" + orig_source_ext_re + r"|(?:debian\.)?tar\.(?:gz|bz2|xz)|diff\.gz)"
  38. re_source_ext = re.compile("(" + file_source_ext_re + r"|dsc)$")
  39. re_issource = re.compile(r"(.+)_(.+?)\." + re_source_ext.pattern)
  40. re_single_line_field = re.compile(r"^(\S*?)\s*:\s*(.*)")
  41. re_multi_line_field = re.compile(r"^\s(.*)")
  42. re_taint_free = re.compile(r"^[-+~/\.\w]+$")
  43. re_parse_maintainer = re.compile(r"^\s*(\S.*\S)\s*\<([^\>]+)\>")
  44. re_srchasver = re.compile(r"^(\S+)\s+\((\S+)\)$")
  45. re_verwithext = re.compile(r"^(\d+)(?:\.(\d+))(?:\s+\((\S+)\))?$")
  46. # From clean_proposed_updates.py
  47. re_isdeb = re.compile(r"^(.+)_(.+?)_(.+?).u?deb$")
  48. # From examine_package.py
  49. re_package = re.compile(r"^(.+?)_.*")
  50. re_doc_directory = re.compile(r".*/doc/([^/]*).*")
  51. re_contrib = re.compile('^contrib/')
  52. re_nonfree = re.compile('^(?:non-free-firmware|non-free)/')
  53. re_localhost = re.compile(r"localhost\.localdomain")
  54. re_version = re.compile(r'^(.*)\((.*)\)')
  55. re_newlinespace = re.compile('\n')
  56. re_spacestrip = re.compile(r'(\s)')
  57. # From new_security_install.py
  58. re_taint_free = re.compile(r"^['/;\-\+\.~\s\w]+$")
  59. # From process_unchecked.py
  60. re_changelog_versions = re.compile(r"^\w[-+0-9a-z.]+ \([^\(\) \t]+\)")
  61. # From dak/rm.py
  62. re_strip_source_version = re.compile(r'\s+.*$')
  63. re_build_dep_arch = re.compile(r"\[[^]]+\]")
  64. # From dak/transitions.py
  65. re_broken_package = re.compile(r"[a-zA-Z]\w+\s+\-.*")
  66. # From dak/add_user.py
  67. re_gpg_fingerprint_colon = re.compile(r"^fpr:+(.*):$", re.MULTILINE)
  68. # The next one is dirty
  69. re_user_address = re.compile(r"^pub:.*<(.*)@.*>.*$", re.MULTILINE)
  70. re_user_mails = re.compile(r"^(pub|uid):[^rdin].*<(.*@.*)>.*$", re.MULTILINE)
  71. re_user_name = re.compile(r"^pub:.*:(.*)<.*$", re.MULTILINE)
  72. re_re_mark = re.compile(r'^RE:')
  73. re_parse_lintian = re.compile(r"^(?P<level>W|E|O): (?P<package>.*?): (?P<tag>[^ ]*) ?(?P<description>.*)$")
  74. # in generate-releases
  75. re_gensubrelease = re.compile(r".*/(binary-[0-9a-z-]+|source)$")
  76. re_includeinrelease_byhash = re.compile(r"(Translation-[a-zA-Z_]+\.(?:bz2|xz|zst)|Contents-[0-9a-z-]+.gz|Index|Packages(.gz|.bz2|.xz|.zst)?|Sources(.gz|.bz2|.xz|.zst)?|Components-[0-9a-z-]+.yml(.gz|.xz)|icons-[0-9x-]+.tar(.gz|.xz)|Release)$")
  77. re_includeinrelease_plain = re.compile(r"(MD5SUMS|SHA256SUMS)$")
  78. # in generate_index_diffs
  79. re_includeinpdiff = re.compile(r"(Translation-[a-zA-Z_]+\.(?:bz2|xz|zst))")
  80. ######################################################################
  81. # Patterns matching filenames #
  82. ######################################################################
  83. # Match safe filenames
  84. re_file_safe = re.compile(r'^[a-zA-Z0-9][a-zA-Z0-9_.~+-]*$')
  85. # Match safe filenames, including slashes
  86. re_file_safe_slash = re.compile(r'^[a-zA-Z0-9][/a-zA-Z0-9_.~+-]*$')
  87. # Prefix of binary and source filenames
  88. _re_file_prefix = r'^(?P<package>[a-z0-9][a-z0-9.+-]+)_(?P<version>[A-Za-z0-9.~+-]+?)'
  89. # Match binary packages
  90. # Groups: package, version, architecture, type
  91. re_file_binary = re.compile(_re_file_prefix + r'_(?P<architecture>[a-z0-9-]+)\.(?P<type>u?deb)$')
  92. # Match changes files
  93. # Groups: package, version, suffix
  94. re_file_changes = re.compile(_re_file_prefix + r'_(?P<suffix>[a-zA-Z0-9+-]+)\.changes$')
  95. # Match dsc files
  96. # Groups: package, version
  97. re_file_dsc = re.compile(_re_file_prefix + r'\.dsc$')
  98. # Match other source files
  99. # Groups: package, version
  100. re_file_source = re.compile(_re_file_prefix + r'\.' + file_source_ext_re)
  101. # Match upstream tarball
  102. # Groups: package, version
  103. re_file_orig = re.compile(_re_file_prefix + r'\.' + orig_source_ext_re)
  104. # Match buildinfo file
  105. # Groups: package, version, suffix
  106. re_file_buildinfo = re.compile(_re_file_prefix + r'_(?P<suffix>[a-zA-Z0-9+-]+)\.buildinfo$')
  107. ######################################################################
  108. # Patterns matching fields #
  109. ######################################################################
  110. # Match package name
  111. re_field_package = re.compile(r'^[a-z0-9][a-z0-9.+-]+$')
  112. # Match version
  113. # Groups: without-epoch
  114. re_field_version = re.compile(r'^(?:[0-9]+:)?(?P<without_epoch>[A-Za-z0-9.:~+-]+)$')
  115. # Extract upstream version
  116. # Groups: upstream
  117. re_field_version_upstream = re.compile(r'^(?:[0-9]+:)?(?P<upstream>.*)-[^-]*$')
  118. # Match source field
  119. # Groups: package, version
  120. re_field_source = re.compile(r'^(?P<package>[a-z0-9][a-z0-9.+-]+)(?:\s*\((?P<version>[A-Za-z0-9.:~+-]+)\))?$')