POSIX正则表达式不匹配

POSIX regex not matching

本文关键字:不匹配 正则表达式 POSIX      更新时间:2023-10-16

这是我第一次尝试POSIX正则表达式。我尝试了下面的代码,但没有得到预期的结果。我需要从字符串中单独获取数字。我在Linux Mint上运行代码,用g++ 4.7.2编译

#include <stdio.h>
#include <strings.h>
#include <regex.h>
int main()
{
    int ret;
    char string[512] = "Odd:97531|Even:86420";
    regex_t pattern;
    ret = regcomp(&pattern, "[0-9]*", REG_EXTENDED);
    if(ret < 0) 
    { 
        char err[512] = {};
        regerror(ret, &pattern, err, 500);
        printf("Regex compile error : %sn", err);
        return -1;
    }
    else
    {
        printf("Number of subexpression : %dn", pattern.re_nsub);
    }
    int nmatch = 5;
    regmatch_t match[5];
    ret = regexec(&pattern, string, nmatch, match, 0);
    if(ret < 0)
    {
        char err[512] = {};
        regerror(ret, &pattern, err, 500);
        printf("Regex execute error : %sn", err);
        return -2;
    }
    else
    {
        printf("Number of subexpression : %dn", pattern.re_nsub);
        for(int I = 0; I < nmatch; I++)
            printf("Match %02d : %.*s (%d to %d)n", I + 1, 
            match[I].rm_eo - match[I].rm_so, string + match[I].rm_so, 
            match[I].rm_so, match[I].rm_eo);
    }
    return 0;
}

输出
Number of subexpression : 0
Number of subexpression : 0
Match 01 :  (0 to 0)
Match 02 :  (-1 to -1)
Match 03 :  (-1 to -1)
Match 04 :  (-1 to -1)
Match 05 :  (-1 to -1)

我做错了什么?谁来帮帮我。

[0-9]*匹配 0个或多个十进制数字。显然,字符串的开头是匹配的。您可能需要[0-9]+,它代表一个或多个十进制数字。

此外,为了多次匹配相同的模式,您需要以不同的偏移量多次调用regexec()nmatch是针对regex中的不同括号,而不是针对多次匹配。

完整的精炼代码如下:

int main()
{
    int ret;
    char string[512] = "Odd:97531|Even:86420";
    regex_t pattern;
    ret = regcomp(&pattern, "[0-9]+", REG_EXTENDED);
    if(ret != 0)
    {
        char err[512] = {};
        regerror(ret, &pattern, err, 500);
        printf("Regex compile error : %sn", err);
        return -1;
    }
    else
    {
        printf("Number of subexpression : %dn", pattern.re_nsub);
    }
    regmatch_t match;
    char *notmatched = string;
    for (int I = 1; regexec(&pattern, notmatched, 1, &match, 0) == 0; ++I) {
        printf("Match %02d : %.*s (%d to %d)n", I,
                match.rm_eo - match.rm_so, notmatched + match.rm_so,
                match.rm_so, match.rm_eo);
        notmatched += match.rm_eo;
    }
    return 0;
}