最常想到的方法是使用KMP字符串匹配算法:
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
|
#include <stdio.h> #include <stdlib.h> #include <string.h> int get_nextval( char *pattern, int next[]) { //get the next value of the pattern int i = 0, j = -1; next[0] = -1; int patlen = strlen (pattern); while ( i < patlen - 1){ if ( j == -1 || pattern[i] == pattern[j]){ ++i; ++j; if (pattern[i] != pattern[j]) next[i] = j; else next[i] = next[j]; } else j = next[j]; } return (0); } int kmpindex( char *target, char *pattern, int pos) { int tari = pos, pati = 0; int tarlen = strlen (target), patlen = strlen (pattern); int *next = ( int *) malloc (patlen * sizeof ( int )); get_nextval(pattern, next); while ( tari < tarlen && pati < patlen ){ if (pati == -1 ||target[tari] == pattern[pati]){ ++tari; ++pati; } else { pati = next[pati]; } } if (next != NULL) free (next); next = NULL; if (pati == patlen) return tari - pati; else return -1; } int main() { char target[50], pattern[50]; printf ( "imput the target:\n" ); scanf ( "%s" ,target); printf ( "imput the pattern:\n" ); scanf ( "%s" ,pattern); int ans = kmpindex(target,pattern,0); if (ans == -1) printf ( "error\n" ); else printf ( "index:%d\n" ,ans); return 0; } |
练习题
题目描述:
读入数据string[ ],然后读入一个短字符串。要求查找string[ ]中和短字符串的所有匹配,输出行号、匹配字符串。匹配时不区分大小写,并且可以有一个用中括号表示的模式匹配。如“aa[123]bb”,就是说aa1bb、aa2bb、aa3bb都算匹配。
输入:
输入有多组数据。
每组数据第一行输入n(1<=n<=1000),从第二行开始输入n个字符串(不含空格),接下来输入一个匹配字符串。
输出:
输出匹配到的字符串的行号和该字符串(匹配时不区分大小写)。
样例输入:
4
Aab
a2B
ab
ABB
a[a2b]b
样例输出:
1 Aab
2 a2B
4 ABB
ac代码
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
|
#include <stdio.h> #include <stdlib.h> #include <string.h> #define MAX 1001 #define LEN 101 struct str { char name[101]; }; int main() { struct str strs[MAX]; struct str t[LEN]; int i, n, len, j, k, left, right, count, flag; char text[LEN], newtext[LEN]; while ( scanf ( "%d" , &n) != EOF) { // 接收数据 getchar (); for (i = 0; i < n; i ++) { scanf ( "%s" , strs[i].name); } // 接收文本串 getchar (); gets (text); len = strlen (text); for (i = left = right = 0; i < len; i ++) { if (text[i] == '[' ) { left = i; } else if (text[i] == ']' ) { right = i; break ; } } count = right - left - 1; if (count <= 0) { // 没有正则匹配 for (i = j = 0; i < len; i ++) { if (text[i] != '[' && text[i] != ']' ) { newtext[j ++] = text[i]; } } newtext[j] = '\0' ; for (i = 0; i < n; i ++) { if (strcasecmp(strs[i].name, newtext) == 0) { printf ( "%d %s\n" , i + 1, strs[i].name); } } } else { // 需要正则匹配 for (j = 1, k = 0; j <= count; j ++, k ++) { // 构建文本数组 memset (t[k].name, '\0' , sizeof (t[k].name)); for (i = 0; i < left; i ++) { t[k].name[i] = text[i]; } t[k].name[i] = text[left + j]; strcat (t[k].name, text + right + 1); } // 正则匹配 for (i = 0; i < n; i ++) { for (j = flag = 0; j < count; j ++) { if (strcasecmp(strs[i].name, t[j].name) == 0) { flag = 1; break ; } } if (flag) { printf ( "%d %s\n" , i + 1, strs[i].name); } } } } return 0; } |
/**************************************************************
Problem: 1165
User: wangzhengyi
Language: C
Result: Accepted
Time:0 ms
Memory:948 kb
****************************************************************/