BigW Consortium Gitlab

regex.rb 5.01 KB
Newer Older
1 2 3 4
module Gitlab
  module Regex
    extend self

5 6 7 8 9 10
    # The namespace regex is used in Javascript to validate usernames in the "Register" form. However, Javascript
    # does not support the negative lookbehind assertion (?<!) that disallows usernames ending in `.git` and `.atom`.
    # Since this is a non-trivial problem to solve in Javascript (heavily complicate the regex, modify view code to
    # allow non-regex validatiions, etc), `NAMESPACE_REGEX_STR_SIMPLE` serves as a Javascript-compatible version of
    # `NAMESPACE_REGEX_STR`, with the negative lookbehind assertion removed. This means that the client-side validation
    # will pass for usernames ending in `.atom` and `.git`, but will be caught by the server-side validation.
11 12
    PATH_REGEX_STR = '[a-zA-Z0-9_\.][a-zA-Z0-9_\-\.]*'.freeze
    NAMESPACE_REGEX_STR_SIMPLE = PATH_REGEX_STR + '[a-zA-Z0-9_\-]|[a-zA-Z0-9_]'.freeze
13
    NAMESPACE_REGEX_STR = '(?:' + NAMESPACE_REGEX_STR_SIMPLE + ')(?<!\.git|\.atom)'.freeze
14
    PROJECT_REGEX_STR = PATH_REGEX_STR + '(?<!\.git|\.atom)'.freeze
15

16 17 18 19
    # Same as NAMESPACE_REGEX_STR but allows `/` in the path.
    # So `group/subgroup` will match this regex but not NAMESPACE_REGEX_STR
    NAMESPACE_REF_REGEX_STR = '(?:[a-zA-Z0-9_\.][a-zA-Z0-9_\-\.\/]*[a-zA-Z0-9_\-]|[a-zA-Z0-9_])(?<!\.git|\.atom)'.freeze

20 21
    def namespace_regex
      @namespace_regex ||= /\A#{NAMESPACE_REGEX_STR}\z/.freeze
22 23
    end

24 25 26 27
    def namespace_route_regex
      @namespace_route_regex ||= /#{NAMESPACE_REGEX_STR}/.freeze
    end

28
    def namespace_regex_message
29
      "can contain only letters, digits, '_', '-' and '.'. " \
30
      "Cannot start with '-' or end in '.', '.git' or '.atom'." \
31 32 33
    end

    def namespace_name_regex
34
      @namespace_name_regex ||= /\A[\p{Alnum}\p{Pd}_\. ]*\z/.freeze
35 36
    end

37
    def namespace_name_regex_message
38
      "can contain only letters, digits, '_', '.', dash and space."
39 40
    end

41
    def project_name_regex
42
      @project_name_regex ||= /\A[\p{Alnum}\u{00A9}-\u{1f9c0}_][\p{Alnum}\p{Pd}\u{00A9}-\u{1f9c0}_\. ]*\z/.freeze
43 44
    end

45
    def project_name_regex_message
46 47
      "can contain only letters, digits, emojis, '_', '.', dash, space. " \
      "It must start with letter, digit, emoji or '_'."
48 49
    end

50
    def project_path_regex
51 52 53 54 55 56 57 58 59
      @project_path_regex ||= /\A#{PROJECT_REGEX_STR}\z/.freeze
    end

    def project_route_regex
      @project_route_regex ||= /#{PROJECT_REGEX_STR}/.freeze
    end

    def project_git_route_regex
      @project_route_git_regex ||= /#{PATH_REGEX_STR}\.git/.freeze
60 61
    end

62 63
    def project_path_regex_message
      "can contain only letters, digits, '_', '-' and '.'. " \
64
      "Cannot start with '-', end in '.git' or end in '.atom'" \
65 66
    end

67
    def file_name_regex
68
      @file_name_regex ||= /\A[[[:alnum:]]_\-\.\@\+]*\z/.freeze
69
    end
70

71
    def file_name_regex_message
72
      "can contain only letters, digits, '_', '-', '@', '+' and '.'."
73 74
    end

75
    def file_path_regex
76
      @file_path_regex ||= /\A[[[:alnum:]]_\-\.\/\@]*\z/.freeze
77 78 79
    end

    def file_path_regex_message
80
      "can contain only letters, digits, '_', '-', '@' and '.'. Separate directories with a '/'."
81 82 83 84 85 86 87
    end

    def directory_traversal_regex
      @directory_traversal_regex ||= /\.{2}/.freeze
    end

    def directory_traversal_regex_message
88
      "cannot include directory traversal."
89 90
    end

91
    def archive_formats_regex
92 93
      #                           |zip|tar|    tar.gz    |         tar.bz2         |
      @archive_formats_regex ||= /(zip|tar|tar\.gz|tgz|gz|tar\.bz2|tbz|tbz2|tb2|bz2)/.freeze
94
    end
95

96 97 98 99
    def git_reference_regex
      # Valid git ref regex, see:
      # https://www.kernel.org/pub/software/scm/git/docs/git-check-ref-format.html

100
      @git_reference_regex ||= %r{
101
        (?!
102 103 104
           (?# doesn't begins with)
           \/|                    (?# rule #6)
           (?# doesn't contain)
105
           .*(?:
106 107 108 109
              [\/.]\.|            (?# rule #1,3)
              \/\/|               (?# rule #6)
              @\{|                (?# rule #8)
              \\                  (?# rule #9)
110 111
           )
        )
112 113 114 115
        [^\000-\040\177~^:?*\[]+  (?# rule #4-5)
        (?# doesn't end with)
        (?<!\.lock)               (?# rule #1)
        (?<![\/.])                (?# rule #6-7)
116
      }x.freeze
117
    end
118

Kamil Trzcinski committed
119
    def container_registry_reference_regex
120 121
      git_reference_regex
    end
122 123

    def environment_name_regex
124
      @environment_name_regex ||= /\A[a-zA-Z0-9_\\\/\${}. -]+\z/.freeze
125 126 127
    end

    def environment_name_regex_message
128
      "can contain only letters, digits, '-', '_', '/', '$', '{', '}', '.' and spaces"
129
    end
130 131 132 133 134 135 136 137

    def kubernetes_namespace_regex
      /\A[a-z0-9]([-a-z0-9]*[a-z0-9])?\z/
    end

    def kubernetes_namespace_regex_message
      "can contain only letters, digits or '-', and cannot start or end with '-'"
    end
Nick Thomas committed
138 139 140 141 142 143 144 145 146

    def environment_slug_regex
      @environment_slug_regex ||= /\A[a-z]([a-z0-9-]*[a-z0-9])?\z/.freeze
    end

    def environment_slug_regex_message
      "can contain only lowercase letters, digits, and '-'. " \
      "Must start with a letter, and cannot end with '-'"
    end
147 148
  end
end