- 论坛徽章:
- 2
|
- #include <string.h>
- int charset_in(int c, const char *set)
- {
- const unsigned char *p;
- unsigned char uc;
- int retval;
- p = (const unsigned char *)set;
- uc = (unsigned char)c;
- for (; *p != '\0'; ++p) {
- if (*p == '-') {
- ++p;
- retval = 0;
- }else {
- retval = 1;
- }
- if (*p == 'L') {
- for (++p; *p != '\0'; ++p) {
- if (*p == uc) {
- return retval;
- }
- }
- }else if (*p == 'S') {
- for (++p; *p != '\0' && *(p + 1) != '\0'; p += 2) {
- if (uc >= *p && uc <= *(p + 1)) {
- return retval;
- }
- }
- }
- }
- return 0;
- }
- int skip_text(const char *s, int *io_off, int lmt, const char *text)
- {
- int off;
- int len;
- off = *io_off;
- len = strlen(text);
- if (off + len <= lmt) {
- if (strncmp(s + off, text, len) == 0) {
- *io_off = off + len;
- return 0;
- }
- }
- return -1;
- }
- int skip_token(const char *s, int *io_off, int lmt, const char *charset)
- {
- int off;
- off = *io_off;
- if (off < lmt && charset_in(s[off], charset)) {
- do {
- ++off;
- }while (off < lmt && charset_in(s[off], charset));
- *io_off = off;
- return 0;
- }
- return -1;
- }
- int check_url_id(const char *s, int *io_off, int lmt)
- {
- int off;
- off = *io_off;
- if (off < lmt) {
- if (charset_in(s[off], "L_\0SazAZ\0")) {
- if (skip_token(s, &off, lmt, "L_-\0SazAZ09\0") == 0) {
- *io_off = off;
- return 0;
- }
- }
- }
- return -1;
- }
- int check_urlname(const char *s, int *io_off, int lmt)
- {
- int off;
- off = *io_off;
- if (skip_token(s, &off, lmt, "L-%\0SazAZ09\0") == 0) {
- *io_off = off;
- return 0;
- }
- return -1;
- }
- int check_portnum(const char *s, int *io_off, int lmt)
- {
- int off;
- off = *io_off;
- if (skip_token(s, &off, lmt, "S09\0") == 0) {
- *io_off = off;
- return 0;
- }
- return -1;
- }
- int check_urlpath(const char *s, int *io_off, int lmt)
- {
- int off;
- off = *io_off;
- while (skip_text(s, &off, lmt, "/") == 0
- && check_urlname(s, &off, lmt) == 0) {
- }
- *io_off = off;
- return 0;
- }
- int check_urlparam_item(const char *s, int *io_off, int lmt)
- {
- int off;
- off = *io_off;
- if (check_urlname(s, &off, lmt) == 0) {
- if (skip_text(s, &off, lmt, "=") == 0) {
- if (check_urlname(s, &off, lmt) == 0) {
- *io_off = off;
- return 0;
- }
- }else {
- *io_off = off;
- return 0;
- }
- }
- return -1;
- }
- int check_urlparam(const char *s, int *io_off, int lmt)
- {
- int off;
- off = *io_off;
- if (skip_text(s, &off, lmt, "?") == 0) {
- if (check_urlparam_item(s, &off, lmt) == 0) {
- while (skip_text(s, &off, lmt, "&") == 0
- && check_urlparam_item(s, &off, lmt) == 0) {
- }
- }
- }
- *io_off = off;
- return 0;
- }
- int check_urltag(const char *s, int *io_off, int lmt)
- {
- int off;
- off = *io_off;
- if (skip_text(s, &off, lmt, "#") == 0) {
- check_url_id(s, &off, lmt);
- }
- *io_off = off;
- return 0;
- }
- int check_url(const char *url, int url_len)
- {
- int off;
- off = 0;
- if (check_url_id(url, &off, url_len) == 0) {
- if (skip_text(url, &off, url_len, "://") == 0) {
- if (check_urlname(url, &off, url_len) == 0) {
- if (skip_text(url, &off, url_len, ":") == 0) {
- if (check_urlname(url, &off, url_len) == 0) {
- if (skip_text(url, &off, url_len, "@") == 0) {
- if (check_urlname(url, &off, url_len) == 0) {
- while (skip_text(url, &off, url_len, ".") == 0
- && check_urlname(url, &off, url_len) == 0) {
- }
- if (skip_text(url, &off, url_len, ":") == 0) {
- check_portnum(url, &off, url_len);
- }
- check_urlpath(url, &off, url_len);
- check_urlparam(url, &off, url_len);
- check_urltag(url, &off, url_len);
- if (off == url_len) {
- return 0;
- }
- }
- }
- }
- }else if (skip_text(url, &off, url_len, "@") == 0) {
- if (check_urlname(url, &off, url_len) == 0) {
- while (skip_text(url, &off, url_len, ".") == 0
- && check_urlname(url, &off, url_len) == 0) {
- }
- if (skip_text(url, &off, url_len, ":") == 0) {
- check_portnum(url, &off, url_len);
- }
- check_urlpath(url, &off, url_len);
- check_urlparam(url, &off, url_len);
- check_urltag(url, &off, url_len);
- if (off == url_len) {
- return 0;
- }
- }
- }else {
- while (skip_text(url, &off, url_len, ".") == 0
- && check_urlname(url, &off, url_len) == 0) {
- }
- if (skip_text(url, &off, url_len, ":") == 0) {
- check_portnum(url, &off, url_len);
- }
- check_urlpath(url, &off, url_len);
- check_urlparam(url, &off, url_len);
- check_urltag(url, &off, url_len);
- if (off == url_len) {
- return 0;
- }
- }
- }
- }
- }
- return -1;
- }
- /* TESTING */
- #define LENGTH(a) (sizeof(a)/sizeof((a)[0]))
- #include <stdio.h>
- int main(void)
- {
- struct url_example {
- const char *url_text;
- int result;
- }url_examples[] = {
- "http://abc@aa1.com:368?a=123&b=456#kkk", 0,
- "http://abc.aa1.com:368?a=123&b=456#kkk", 0,
- "http://abc@abc.aa1.com?a=123&b=456#kkk", 0,
- "http://abc.aa1.com", 0,
- "ftp://user:password@abc.aa1.com:22", 0,
- "http://123@abc.aa1.com#kk", 0,
- "http://abc@aa-bb.net:387?a=23343&b=%2f#kslkj", 0,
- "http://abc@aa-bb.net:3a87?a=23343&b=%2f#kslkj", -1,
- "http-ftp@://www.sina.com", -1,
- };
- int i;
- int retval;
- for (i = 0; i < LENGTH(url_examples); ++i) {
- fputs(url_examples[i].url_text, stdout);
- retval = check_url(url_examples[i].url_text, strlen(url_examples[i].url_text));
- if (url_examples[i].result == 0) {
- fputs(" => CORRECT TESTING... ", stdout);
- }else {
- fputs(" => WRONG TESTING... ", stdout);
- }
- if (retval == url_examples[i].result) {
- puts("PASSED");
- }else {
- puts("FAILED");
- }
- }
- return 0;
- }
复制代码 |
|