|  | #include "git-compat-util.h" | 
|  | #include "line-range.h" | 
|  | #include "xdiff-interface.h" | 
|  | #include "strbuf.h" | 
|  | #include "userdiff.h" | 
|  |  | 
|  | /* | 
|  | * Parse one item in the -L option | 
|  | * | 
|  | * 'begin' is applicable only to relative range anchors. Absolute anchors | 
|  | * ignore this value. | 
|  | * | 
|  | * When parsing "-L A,B", parse_loc() is called once for A and once for B. | 
|  | * | 
|  | * When parsing A, 'begin' must be a negative number, the absolute value of | 
|  | * which is the line at which relative start-of-range anchors should be | 
|  | * based. Beginning of file is represented by -1. | 
|  | * | 
|  | * When parsing B, 'begin' must be the positive line number immediately | 
|  | * following the line computed for 'A'. | 
|  | */ | 
|  | static const char *parse_loc(const char *spec, nth_line_fn_t nth_line, | 
|  | void *data, long lines, long begin, long *ret) | 
|  | { | 
|  | char *term; | 
|  | const char *line; | 
|  | long num; | 
|  | int reg_error; | 
|  | regex_t regexp; | 
|  | regmatch_t match[1]; | 
|  |  | 
|  | /* Allow "-L <something>,+20" to mean starting at <something> | 
|  | * for 20 lines, or "-L <something>,-5" for 5 lines ending at | 
|  | * <something>. | 
|  | */ | 
|  | if (1 <= begin && (spec[0] == '+' || spec[0] == '-')) { | 
|  | num = strtol(spec + 1, &term, 10); | 
|  | if (term != spec + 1) { | 
|  | if (!ret) | 
|  | return term; | 
|  | if (num == 0) | 
|  | die("-L invalid empty range"); | 
|  | if (spec[0] == '-') | 
|  | num = 0 - num; | 
|  | if (0 < num) | 
|  | *ret = begin + num - 2; | 
|  | else if (!num) | 
|  | *ret = begin; | 
|  | else | 
|  | *ret = begin + num > 0 ? begin + num : 1; | 
|  | return term; | 
|  | } | 
|  | return spec; | 
|  | } | 
|  | num = strtol(spec, &term, 10); | 
|  | if (term != spec) { | 
|  | if (ret) { | 
|  | if (num <= 0) | 
|  | die("-L invalid line number: %ld", num); | 
|  | *ret = num; | 
|  | } | 
|  | return term; | 
|  | } | 
|  |  | 
|  | if (begin < 0) { | 
|  | if (spec[0] != '^') | 
|  | begin = -begin; | 
|  | else { | 
|  | begin = 1; | 
|  | spec++; | 
|  | } | 
|  | } | 
|  |  | 
|  | if (spec[0] != '/') | 
|  | return spec; | 
|  |  | 
|  | /* it could be a regexp of form /.../ */ | 
|  | for (term = (char *) spec + 1; *term && *term != '/'; term++) { | 
|  | if (*term == '\\') | 
|  | term++; | 
|  | } | 
|  | if (*term != '/') | 
|  | return spec; | 
|  |  | 
|  | /* in the scan-only case we are not interested in the regex */ | 
|  | if (!ret) | 
|  | return term+1; | 
|  |  | 
|  | /* try [spec+1 .. term-1] as regexp */ | 
|  | *term = 0; | 
|  | begin--; /* input is in human terms */ | 
|  | line = nth_line(data, begin); | 
|  |  | 
|  | if (!(reg_error = regcomp(®exp, spec + 1, REG_NEWLINE)) && | 
|  | !(reg_error = regexec(®exp, line, 1, match, 0))) { | 
|  | const char *cp = line + match[0].rm_so; | 
|  | const char *nline; | 
|  |  | 
|  | while (begin++ < lines) { | 
|  | nline = nth_line(data, begin); | 
|  | if (line <= cp && cp < nline) | 
|  | break; | 
|  | line = nline; | 
|  | } | 
|  | *ret = begin; | 
|  | regfree(®exp); | 
|  | *term++ = '/'; | 
|  | return term; | 
|  | } | 
|  | else { | 
|  | char errbuf[1024]; | 
|  | regerror(reg_error, ®exp, errbuf, 1024); | 
|  | die("-L parameter '%s' starting at line %ld: %s", | 
|  | spec + 1, begin + 1, errbuf); | 
|  | } | 
|  | } | 
|  |  | 
|  | static int match_funcname(xdemitconf_t *xecfg, const char *bol, const char *eol) | 
|  | { | 
|  | if (xecfg) { | 
|  | char buf[1]; | 
|  | return xecfg->find_func(bol, eol - bol, buf, 1, | 
|  | xecfg->find_func_priv) >= 0; | 
|  | } | 
|  |  | 
|  | if (bol == eol) | 
|  | return 0; | 
|  | if (isalpha(*bol) || *bol == '_' || *bol == '$') | 
|  | return 1; | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | static const char *find_funcname_matching_regexp(xdemitconf_t *xecfg, const char *start, | 
|  | regex_t *regexp) | 
|  | { | 
|  | int reg_error; | 
|  | regmatch_t match[1]; | 
|  | while (1) { | 
|  | const char *bol, *eol; | 
|  | reg_error = regexec(regexp, start, 1, match, 0); | 
|  | if (reg_error == REG_NOMATCH) | 
|  | return NULL; | 
|  | else if (reg_error) { | 
|  | char errbuf[1024]; | 
|  | regerror(reg_error, regexp, errbuf, 1024); | 
|  | die("-L parameter: regexec() failed: %s", errbuf); | 
|  | } | 
|  | /* determine extent of line matched */ | 
|  | bol = start+match[0].rm_so; | 
|  | eol = start+match[0].rm_eo; | 
|  | while (bol > start && *bol != '\n') | 
|  | bol--; | 
|  | if (*bol == '\n') | 
|  | bol++; | 
|  | while (*eol && *eol != '\n') | 
|  | eol++; | 
|  | if (*eol == '\n') | 
|  | eol++; | 
|  | /* is it a funcname line? */ | 
|  | if (match_funcname(xecfg, (char*) bol, (char*) eol)) | 
|  | return bol; | 
|  | start = eol; | 
|  | } | 
|  | } | 
|  |  | 
|  | static const char *parse_range_funcname( | 
|  | const char *arg, nth_line_fn_t nth_line_cb, | 
|  | void *cb_data, long lines, long anchor, long *begin, long *end, | 
|  | const char *path, struct index_state *istate) | 
|  | { | 
|  | char *pattern; | 
|  | const char *term; | 
|  | struct userdiff_driver *drv; | 
|  | xdemitconf_t *xecfg = NULL; | 
|  | const char *start; | 
|  | const char *p; | 
|  | int reg_error; | 
|  | regex_t regexp; | 
|  |  | 
|  | if (*arg == '^') { | 
|  | anchor = 1; | 
|  | arg++; | 
|  | } | 
|  |  | 
|  | assert(*arg == ':'); | 
|  | term = arg+1; | 
|  | while (*term && *term != ':') { | 
|  | if (*term == '\\' && *(term+1)) | 
|  | term++; | 
|  | term++; | 
|  | } | 
|  | if (term == arg+1) | 
|  | return NULL; | 
|  | if (!begin) /* skip_range_arg case */ | 
|  | return term; | 
|  |  | 
|  | pattern = xstrndup(arg+1, term-(arg+1)); | 
|  |  | 
|  | anchor--; /* input is in human terms */ | 
|  | start = nth_line_cb(cb_data, anchor); | 
|  |  | 
|  | drv = userdiff_find_by_path(istate, path); | 
|  | if (drv && drv->funcname.pattern) { | 
|  | const struct userdiff_funcname *pe = &drv->funcname; | 
|  | xecfg = xcalloc(1, sizeof(*xecfg)); | 
|  | xdiff_set_find_func(xecfg, pe->pattern, pe->cflags); | 
|  | } | 
|  |  | 
|  | reg_error = regcomp(®exp, pattern, REG_NEWLINE); | 
|  | if (reg_error) { | 
|  | char errbuf[1024]; | 
|  | regerror(reg_error, ®exp, errbuf, 1024); | 
|  | die("-L parameter '%s': %s", pattern, errbuf); | 
|  | } | 
|  |  | 
|  | p = find_funcname_matching_regexp(xecfg, (char*) start, ®exp); | 
|  | if (!p) | 
|  | die("-L parameter '%s' starting at line %ld: no match", | 
|  | pattern, anchor + 1); | 
|  | *begin = 0; | 
|  | while (p > nth_line_cb(cb_data, *begin)) | 
|  | (*begin)++; | 
|  |  | 
|  | if (*begin >= lines) | 
|  | die("-L parameter '%s' matches at EOF", pattern); | 
|  |  | 
|  | *end = *begin+1; | 
|  | while (*end < lines) { | 
|  | const char *bol = nth_line_cb(cb_data, *end); | 
|  | const char *eol = nth_line_cb(cb_data, *end+1); | 
|  | if (match_funcname(xecfg, bol, eol)) | 
|  | break; | 
|  | (*end)++; | 
|  | } | 
|  |  | 
|  | regfree(®exp); | 
|  | free(xecfg); | 
|  | free(pattern); | 
|  |  | 
|  | /* compensate for 1-based numbering */ | 
|  | (*begin)++; | 
|  |  | 
|  | return term; | 
|  | } | 
|  |  | 
|  | int parse_range_arg(const char *arg, nth_line_fn_t nth_line_cb, | 
|  | void *cb_data, long lines, long anchor, | 
|  | long *begin, long *end, | 
|  | const char *path, struct index_state *istate) | 
|  | { | 
|  | *begin = *end = 0; | 
|  |  | 
|  | if (anchor < 1) | 
|  | anchor = 1; | 
|  | if (anchor > lines) | 
|  | anchor = lines + 1; | 
|  |  | 
|  | if (*arg == ':' || (*arg == '^' && *(arg + 1) == ':')) { | 
|  | arg = parse_range_funcname(arg, nth_line_cb, cb_data, | 
|  | lines, anchor, begin, end, | 
|  | path, istate); | 
|  | if (!arg || *arg) | 
|  | return -1; | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | arg = parse_loc(arg, nth_line_cb, cb_data, lines, -anchor, begin); | 
|  |  | 
|  | if (*arg == ',') | 
|  | arg = parse_loc(arg + 1, nth_line_cb, cb_data, lines, *begin + 1, end); | 
|  |  | 
|  | if (*arg) | 
|  | return -1; | 
|  |  | 
|  | if (*begin && *end && *end < *begin) { | 
|  | SWAP(*end, *begin); | 
|  | } | 
|  |  | 
|  | return 0; | 
|  | } | 
|  |  | 
|  | const char *skip_range_arg(const char *arg, struct index_state *istate) | 
|  | { | 
|  | if (*arg == ':' || (*arg == '^' && *(arg + 1) == ':')) | 
|  | return parse_range_funcname(arg, NULL, NULL, | 
|  | 0, 0, NULL, NULL, | 
|  | NULL, istate); | 
|  |  | 
|  | arg = parse_loc(arg, NULL, NULL, 0, -1, NULL); | 
|  |  | 
|  | if (*arg == ',') | 
|  | arg = parse_loc(arg+1, NULL, NULL, 0, 0, NULL); | 
|  |  | 
|  | return arg; | 
|  | } |