123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351 |
- #
- #
- # Nim Grep Utility
- # (c) Copyright 2012 Andreas Rumpf
- #
- # See the file "copying.txt", included in this
- # distribution, for details about the copyright.
- #
- import
- os, strutils, parseopt, pegs, re, terminal
# Release number; printed by `writeVersion` and embedded in the help banner.
const Version = "1.2"

# Full help text written to stdout by `writeHelp`.
const Usage = "nimgrep - Nim Grep Utility Version " & Version & """
(c) 2012 Andreas Rumpf
Usage:
nimgrep [options] [pattern] [replacement] (file/directory)*
Options:
--find, -f find the pattern (default)
--replace, -r replace the pattern
--peg pattern is a peg
--re pattern is a regular expression (default); extended
syntax for the regular expression is always turned on
--recursive process directories recursively
--confirm confirm each occurrence/replacement; there is a chance
to abort any time without touching the file
--stdin read pattern from stdin (to avoid the shell's confusing
quoting rules)
--word, -w the match should have word boundaries (buggy for pegs!)
--ignoreCase, -i be case insensitive
--ignoreStyle, -y be style insensitive
--ext:EX1|EX2|... only search the files with the given extension(s)
--nocolor output will be given without any colours.
--oneline show file on each matched line
--verbose be verbose: list every processed file
--filenames find the pattern in the filenames, not in the contents
of the file
--help, -h shows this help
--version, -v shows the version
"""
type
  # Switches that can be active at the same time; the option-parsing loop
  # adds and removes members of this enum in the global `options` set.
  TOption = enum
    optFind,
    optReplace,
    optPeg,
    optRegex,
    optRecursive,
    optConfirm,
    optStdin,
    optWord,
    optIgnoreCase,
    optIgnoreStyle,
    optVerbose,
    optFilenames

  # Set of active switches.
  TOptions = set[TOption]

  # Answers `confirm` can return for its interactive prompt.
  TConfirmEnum = enum
    ceAbort,
    ceYes,
    ceAll,
    ceNo,
    ceNone

  # A compiled search pattern: a regular expression or a PEG.
  Pattern = Regex | Peg

# Every parameter that is named `pattern` and declared without a type is a
# `Pattern`.
using pattern: Pattern
# Program state filled in by the command-line parsing loop.
var filenames = newSeq[string]()    # files/directories given as arguments
var pattern = ""                    # pattern text, before compilation
var replacement = ""                # replacement text for --replace
var extensions = newSeq[string]()   # values collected from --ext
var options: TOptions = {optRegex}  # regex matching is the default
var useWriteStyled = true           # cleared by --nocolor
var oneline = false                 # set by --oneline
proc ask(msg: string): string =
  ## Writes `msg` to stdout without a trailing newline, flushes so the prompt
  ## is visible, and returns the next line read from stdin.
  write(stdout, msg)
  flushFile(stdout)
  return readLine(stdin)
proc confirm: TConfirmEnum =
  ## Repeats the confirmation prompt until the normalized answer is one of
  ## the recognised words or their one-letter shortcuts, then returns the
  ## matching `TConfirmEnum` value.
  const prompt = " [a]bort; [y]es, a[l]l, [n]o, non[e]: "
  while true:
    let answer = normalize(ask(prompt))
    if answer == "a" or answer == "abort":
      return ceAbort
    elif answer == "y" or answer == "yes":
      return ceYes
    elif answer == "l" or answer == "all":
      return ceAll
    elif answer == "n" or answer == "no":
      return ceNo
    elif answer == "e" or answer == "none":
      return ceNone
    # anything else: ask again
proc countLines(s: string, first, last: int): int =
  ## Returns the number of line breaks in `s[first..last]`. A CR, an LF, and
  ## a CR LF pair that lies entirely inside the range each count once.
  const
    cr = '\13'
    lf = '\10'
  var pos = first
  while pos <= last:
    case s[pos]
    of cr:
      inc result
      # Swallow the LF of a CR LF pair so the pair is not counted twice.
      if pos < last and s[pos + 1] == lf:
        inc pos
    of lf:
      inc result
    else:
      discard
    inc pos
proc beforePattern(s: string, first: int): int =
  ## Returns the index of the first character of the line that contains
  ## position `first`: one past the closest newline character before
  ## `first`, or 0 when there is none.
  var pos = first - 1
  while pos >= 0 and s[pos] notin NewLines:
    dec pos
  result = pos + 1
proc afterPattern(s: string, last: int): int =
  ## Returns the index of the last character of the line that contains
  ## position `last`: one before the closest newline character after `last`,
  ## or `s.len - 1` when there is none.
  var pos = last + 1
  while pos < s.len and s[pos] notin NewLines:
    inc pos
  result = pos - 1
proc writeColored(s: string) =
  ## Writes `s` to stdout: underlined and bright when the global
  ## `useWriteStyled` is set, plain otherwise.
  if not useWriteStyled:
    stdout.write(s)
    return
  terminal.writeStyled(s, {styleUnderscore, styleBright})
proc highlight(s, match, repl: string, t: tuple[first, last: int],
               filename:string, line: int, showRepl: bool) =
  ## Prints the line of `s` that surrounds the match bounds `t`, with `match`
  ## written through `writeColored`. The line is prefixed with
  ## `filename:line: ` in oneline mode, otherwise with the right-aligned
  ## line number. When `showRepl` is true a second line follows, introduced
  ## by `-> `, that shows the same context with `repl` in place of the match.
  const alignment = 6
  if oneline:
    stdout.write(filename, ":", line, ": ")
  else:
    stdout.write(align($line, alignment), ": ")

  let lineStart = beforePattern(s, t.first)
  let lineEnd = afterPattern(s, t.last)

  template emitLine(middle: string) =
    # text before the match, the styled middle, text after the match
    for k in lineStart ..< t.first: stdout.write(s[k])
    writeColored(middle)
    for k in (t.last + 1) .. lineEnd: stdout.write(s[k])
    stdout.write("\n")
    stdout.flushFile()

  emitLine(match)
  if showRepl:
    stdout.write(spaces(alignment - 1), "-> ")
    emitLine(repl)
proc processFile(pattern; filename: string; counter: var int) =
  ## Searches one file (or, with `optFilenames`, the file name itself) for
  ## `pattern`, reports every match through `highlight` and increments
  ## `counter` once per match.
  ##
  ## With `optReplace` each match is replaced by `replacement` (expanded with
  ## the captured sub-matches); with `optConfirm` the user is asked about
  ## every replacement. The file is rewritten only if its content actually
  ## changed, so untouched or read-only files without accepted replacements
  ## are left alone.
  ##
  ## A file that cannot be read is reported and skipped; a file that cannot
  ## be opened for writing terminates the program.
  var filenameShown = false
  template beforeHighlight =
    # Print the file name once, before its first match, unless --verbose
    # already printed it or --oneline prefixes every match with it.
    if not filenameShown and optVerbose notin options and not oneline:
      stdout.writeLine(filename)
      stdout.flushFile()
      filenameShown = true

  var buffer: string
  if optFilenames in options:
    buffer = filename
  else:
    try:
      buffer = system.readFile(filename)
    except IOError:
      echo "cannot open file: ", filename
      return
  if optVerbose in options:
    stdout.writeLine(filename)
    stdout.flushFile()

  # Replacement text is accumulated here; only used in replace mode.
  var output: string
  if optReplace in options:
    output = newStringOfCap(buffer.len)

  var line = 1
  var i = 0
  var matches: array[0..re.MaxSubpatterns-1, string]
  for j in 0..high(matches): matches[j] = ""
  var reallyReplace = true
  while i < buffer.len:
    let t = findBounds(buffer, pattern, matches, i)
    if t.first < 0: break
    inc(line, countLines(buffer, i, t.first-1))

    var wholeMatch = buffer.substr(t.first, t.last)

    beforeHighlight()
    inc counter
    if optReplace notin options:
      highlight(buffer, wholeMatch, "", t, filename, line, showRepl=false)
    else:
      let r = replace(wholeMatch, pattern, replacement % matches)
      if optConfirm in options:
        highlight(buffer, wholeMatch, r, t, filename, line, showRepl=true)
        case confirm()
        of ceAbort: quit(0)
        of ceYes: reallyReplace = true
        of ceAll:
          reallyReplace = true
          options.excl(optConfirm)
        of ceNo:
          reallyReplace = false
        of ceNone:
          reallyReplace = false
          options.excl(optConfirm)
      else:
        highlight(buffer, wholeMatch, r, t, filename, line,
                  showRepl=reallyReplace)
      if reallyReplace:
        output.add(buffer.substr(i, t.first-1))
        output.add(r)
      else:
        output.add(buffer.substr(i, t.last))

    if t.last >= t.first:
      inc(line, countLines(buffer, t.first, t.last))
      i = t.last+1
    else:
      # Zero-length match: `t.last+1 == t.first`, so the search position
      # would never advance. Step over one character (copying it to the
      # output in replace mode) to guarantee progress.
      i = t.first
      if i < buffer.len:
        if optReplace in options: output.add(buffer[i])
        # Count a CR LF pair only once: skip the CR here and let the LF be
        # counted by the next `countLines` call.
        if buffer[i] == '\10' or (buffer[i] == '\13' and
            (i+1 >= buffer.len or buffer[i+1] != '\10')):
          inc line
        inc i

  if optReplace in options:
    output.add(substr(buffer, i))
    # Do not touch files whose content did not change.
    if output != buffer:
      var f: File
      if open(f, filename, fmWrite):
        try:
          f.write(output)
        finally:
          f.close()
      else:
        quit "cannot open file for overwriting: " & filename
proc hasRightExt(filename: string, exts: seq[string]): bool =
  ## Returns true if the extension of `filename` (without the leading dot)
  ## compares equal, according to `os.cmpPaths`, to any entry of `exts`.
  let dotted = splitFile(filename).ext
  let bare = dotted.substr(1)  # drop the leading '.'
  result = false
  for candidate in exts:
    if os.cmpPaths(candidate, bare) == 0:
      return true
proc styleInsensitive(s: string): string =
  ## Rewrites the regular expression `s` so that underscores become optional:
  ## `_?` is appended after every ASCII letter or digit that is outside a
  ## `[...]` bracket expression, and `?` is appended after every literal `_`.
  ##
  ## A `<...>` name directly following `?` and the character(s) following a
  ## backslash (a run of digits, or a single other character) are copied
  ## unchanged. Patterns that end in the middle of such a construct (for
  ## example a trailing `?` or `\`) are copied as far as they go instead of
  ## reading past the end of the string.
  template addx =
    result.add(s[i])
    inc(i)
  result = ""
  var i = 0
  var brackets = 0
  while i < s.len:
    case s[i]
    of 'A'..'Z', 'a'..'z', '0'..'9':
      addx()
      if brackets == 0: result.add("_?")
    of '_':
      addx()
      result.add('?')
    of '[':
      addx()
      inc(brackets)
    of ']':
      addx()
      if brackets > 0: dec(brackets)
    of '?':
      addx()
      # `?<name>`: copy the name verbatim up to (not including) the '>'.
      if i < s.len and s[i] == '<':
        addx()
        while i < s.len and s[i] != '>' and s[i] != '\0': addx()
    of '\\':
      addx()
      # Copy what the backslash escapes without decorating it.
      if i < s.len:
        if s[i] in strutils.Digits:
          while i < s.len and s[i] in strutils.Digits: addx()
        else:
          addx()
    else: addx()
proc walker(pattern; dir: string; counter: var int) =
  ## Runs `processFile` on the entries of directory `dir`: on every file
  ## whose extension passes the `extensions` filter (no filter when
  ## `extensions` is empty), and, with `optRecursive`, on the contents of
  ## every sub-directory. If `dir` itself is an existing file it is
  ## processed directly, without consulting the extension filter.
  for kind, path in walkDir(dir):
    case kind
    of pcFile:
      if extensions.len == 0 or path.hasRightExt(extensions):
        processFile(pattern, path, counter)
    of pcDir:
      if optRecursive in options:
        walker(pattern, path, counter)
    else: discard
  # `fileExists` is the non-deprecated spelling of `existsFile`.
  if fileExists(dir): processFile(pattern, dir, counter)
proc writeHelp() =
  ## Prints the usage text to stdout and exits with status 0.
  write(stdout, Usage)
  flushFile(stdout)
  quit(QuitSuccess)
proc writeVersion() =
  ## Prints the version number followed by a newline to stdout and exits
  ## with status 0.
  write(stdout, Version, "\n")
  flushFile(stdout)
  quit(QuitSuccess)
proc checkOptions(subset: TOptions, a, b: string) =
  ## Exits with an error message naming `a` and `b` when every member of
  ## `subset` is present in the global `options`, i.e. when two mutually
  ## exclusive switches were both given.
  let conflicting = subset <= options
  if not conflicting: return
  quit("cannot specify both '$#' and '$#'" % [a, b])
# Command-line parsing: positional arguments fill `pattern`, then (in replace
# mode) `replacement`, then `filenames`; switches update `options` and the
# other globals.
for kind, key, val in getopt():
  case kind
  of cmdArgument:
    # With --stdin the pattern is prompted for later, so every positional
    # argument seen while it is set is a file name.
    let fromArgs = optStdin notin options
    if fromArgs and pattern.len == 0:
      pattern = key
    elif fromArgs and optReplace in options and replacement.len == 0:
      replacement = key
    else:
      filenames.add(key)
  of cmdLongOption, cmdShortOption:
    case key.normalize
    of "find", "f": options.incl(optFind)
    of "replace", "r": options.incl(optReplace)
    of "peg":
      options.excl(optRegex)
      options.incl(optPeg)
    of "re":
      options.incl(optRegex)
      options.excl(optPeg)
    of "recursive": options.incl(optRecursive)
    of "confirm": options.incl(optConfirm)
    of "stdin": options.incl(optStdin)
    of "word", "w": options.incl(optWord)
    of "ignorecase", "i": options.incl(optIgnoreCase)
    of "ignorestyle", "y": options.incl(optIgnoreStyle)
    of "ext": extensions.add(val.split('|'))
    of "nocolor": useWriteStyled = false
    of "oneline": oneline = true
    of "verbose": options.incl(optVerbose)
    of "filenames": options.incl(optFilenames)
    of "help", "h": writeHelp()
    of "version", "v": writeVersion()
    else: writeHelp()  # unknown switch: show the help text and exit
  of cmdEnd: assert(false) # cannot happen
when defined(posix):
  # Styled output only makes sense on a terminal. Combine with the current
  # value instead of overwriting it, so an explicit --nocolor (already
  # applied by the option loop) is still honoured when stdout is a tty.
  useWriteStyled = useWriteStyled and terminal.isatty(stdout)

# Reject combinations of mutually exclusive switches.
checkOptions({optFind, optReplace}, "find", "replace")
checkOptions({optPeg, optRegex}, "peg", "re")
checkOptions({optIgnoreCase, optIgnoreStyle}, "ignore_case", "ignore_style")
checkOptions({optFilenames, optReplace}, "filenames", "replace")
# With --stdin the pattern (and, in replace mode, the replacement) is read
# interactively; an empty pattern ends the program.
if optStdin in options:
  pattern = ask("pattern [ENTER to exit]: ")
  if pattern == "":
    quit(QuitSuccess)
  if optReplace in options:
    replacement = ask("replacement [supports $1, $# notations]: ")
# Main driver: compile the pattern as a PEG or a regular expression according
# to `options`, walk every requested path (the current directory when none
# was given) and finally print the number of matches.
if pattern.len == 0:
  writeHelp()
else:
  var counter = 0
  if filenames.len == 0:
    filenames.add(os.getCurrentDir())
  if optRegex notin options:
    if optWord in options:
      pattern = r"(^ / !\letter)(" & pattern & r") !\letter"
    if optIgnoreStyle in options:
      pattern = "\\y " & pattern
    elif optIgnoreCase in options:
      pattern = "\\i " & pattern
    let pegp = peg(pattern)
    for f in items(filenames):
      walker(pegp, f, counter)
  else:
    var reflags = {reStudy, reExtended}
    if optIgnoreStyle in options:
      pattern = styleInsensitive(pattern)
    if optWord in options:
      # `(?:...)` is a non-capturing group, so the user's own capture groups
      # keep their numbers ($1, $2, ...). The spaces are ignored because
      # `reExtended` is always set.
      pattern = r"\b (?:" & pattern & r") \b"
    if {optIgnoreCase, optIgnoreStyle} * options != {}:
      reflags.incl reIgnoreCase
    let rep = re(pattern, reflags)
    for f in items(filenames):
      walker(rep, f, counter)
  if not oneline:
    stdout.write($counter & " matches\n")
|