r3/src/str.c

273 lines
5.6 KiB
C
Raw Normal View History

2014-05-14 22:08:42 -04:00
/*
* str.c
2014-06-27 01:24:40 -04:00
* Copyright (C) 2014 c9s <yoanlin93@gmail.com>
2014-05-14 22:08:42 -04:00
*
* Distributed under terms of the MIT license.
*/
2014-06-01 18:58:02 -04:00
#include "config.h"
2014-05-14 22:08:42 -04:00
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <assert.h>
2014-05-20 11:54:57 -04:00
#include "r3.h"
#include "r3_slug.h"
2015-11-17 08:11:12 -05:00
#include "str.h"
#include "slug.h"
#include "zmalloc.h"
2014-05-14 22:08:42 -04:00
2018-02-20 12:18:43 -05:00
static const char * strnchr(const char* str, unsigned int len, int ch) {
for (unsigned int i = 0; i < len; i++) {
if (str[i] == ch) return str + i;
}
return NULL;
}
int r3_pattern_to_opcode(const char * pattern, unsigned int len) {
2014-05-23 01:49:18 -04:00
if ( strncmp(pattern, "\\w+",len) == 0 ) {
2014-05-23 10:58:20 -04:00
return OP_EXPECT_MORE_WORDS;
}
if ( strncmp(pattern, "[0-9a-z]+",len) == 0 || strncmp(pattern, "[a-z0-9]+",len) == 0 ) {
return OP_EXPECT_MORE_WORDS;
}
if ( strncmp(pattern, "[a-z]+",len) == 0 ) {
return OP_EXPECT_MORE_ALPHA;
2014-05-22 23:25:25 -04:00
}
2014-05-23 01:49:18 -04:00
if ( strncmp(pattern, "\\d+", len) == 0 ) {
2014-05-23 10:58:20 -04:00
return OP_EXPECT_MORE_DIGITS;
}
if ( strncmp(pattern, "[0-9]+", len) == 0 ) {
return OP_EXPECT_MORE_DIGITS;
2014-05-22 23:25:25 -04:00
}
2014-05-23 01:49:18 -04:00
if ( strncmp(pattern, "[^/]+", len) == 0 ) {
2014-05-22 23:25:25 -04:00
return OP_EXPECT_NOSLASH;
}
2014-05-23 01:49:18 -04:00
if ( strncmp(pattern, "[^-]+", len) == 0 ) {
2014-05-22 23:28:19 -04:00
return OP_EXPECT_NODASH;
}
2014-05-22 23:25:25 -04:00
return 0;
}
2014-05-22 23:18:15 -04:00
2014-05-15 10:57:13 -04:00
char * r3_inside_slug(const char * needle, int needle_len, char *offset, char **errstr) {
char * s1 = offset;
char * s2 = offset;
2014-05-21 10:05:10 -04:00
short found_s1 = 0;
short found_s2 = 0;
2014-05-21 08:30:35 -04:00
while( s1 >= needle && (s1 - needle < needle_len) ) {
if ( *s1 == '{' ) {
2014-05-21 10:05:10 -04:00
found_s1 = 1;
break;
}
s1--;
}
2014-05-31 14:56:29 -04:00
const char * end = needle + needle_len;
2014-05-21 08:30:35 -04:00
while( (s2 + 1) < end ) {
if ( *s2 == '}' ) {
2014-05-21 10:05:10 -04:00
found_s2 = 1;
break;
}
s2++;
}
2014-05-21 10:05:10 -04:00
if (found_s1 && found_s2) {
return s1;
}
2014-06-01 08:51:47 -04:00
if (found_s1 || found_s2) {
// wrong slug pattern
if(errstr) {
2014-06-01 18:48:00 -04:00
asprintf(errstr, "Incomplete slug pattern");
2014-06-01 08:51:47 -04:00
}
return NULL;
}
return NULL;
}
2018-02-20 12:18:43 -05:00
const char * r3_slug_find_placeholder(const char *s1, unsigned int str_len, unsigned int *len) {
const char *c;
const char *s2;
int cnt = 0;
if ((c = strnchr(s1, str_len, '{'))) {
// find closing '}'
s2 = c;
unsigned int j = str_len - (c - s1);
for (unsigned int i = 0; i < j; i++) {
if (*s2 == '{' )
cnt++;
else if (*s2 == '}' )
cnt--;
if (cnt == 0)
break;
s2++;
}
} else {
return NULL;
}
if (cnt!=0) {
return NULL;
}
if(len) {
*len = s2 - c + 1;
}
return c;
}
/**
* given a slug string, duplicate the pattern string of the slug
*/
2018-02-20 12:18:43 -05:00
const char * r3_slug_find_pattern(const char *s1, unsigned int str_len, unsigned int *len) {
const char *c;
const char *s2;
unsigned int cnt = 1;
if ( (c = strnchr(s1, str_len, ':')) ) {
c++;
// find closing '}'
s2 = c;
unsigned int j = str_len - (c - s1);
for (unsigned int i = 0; i < j; i++) {
if (*s2 == '{' )
cnt++;
else if (*s2 == '}' )
cnt--;
if (cnt == 0)
break;
s2++;
}
} else {
return NULL;
}
if (cnt!=0) {
return NULL;
}
*len = s2 - c;
return c;
}
/**
* given a slug string, duplicate the parameter name string of the slug
*/
2018-02-20 12:18:43 -05:00
const char * r3_slug_find_name(const char *s1, unsigned int str_len, unsigned int *len) {
const char * c;
const char * s2;
unsigned int plholder;
if ((c = r3_slug_find_placeholder(s1, str_len, &plholder))) {
c++;
if (( s2 = strnchr(c, plholder, ':') )) {
*len = s2 - c;
return c;
} else {
*len = plholder - 2;
return c;
}
} else {
return NULL;
}
}
2014-05-15 08:38:07 -04:00
/**
* @param char * sep separator
*/
char * r3_slug_compile(const char * str, unsigned int len)
2014-05-15 08:38:07 -04:00
{
2018-02-20 12:18:43 -05:00
const char *s1 = NULL;
char *o = NULL;
const char *pat = NULL;
char sep = '/';
// append prefix
unsigned int s1_len;
s1 = r3_slug_find_placeholder(str, len, &s1_len);
if ( !s1 ) {
return zstrndup(str,len);
}
char * out = NULL;
if (!(out = zcalloc(sizeof(char) * 200))) {
return (NULL);
}
o = out;
2014-06-01 13:21:02 -04:00
strncat(o, "^", 1);
o++;
strncat(o, str, s1 - str); // string before slug
o += (s1 - str);
2014-05-15 08:38:07 -04:00
unsigned int pat_len;
pat = r3_slug_find_pattern(s1, s1_len, &pat_len);
if (pat) {
*o = '(';
o++;
strncat(o, pat, pat_len );
o += pat_len;
*o = ')';
o++;
2014-05-15 08:38:07 -04:00
} else {
sprintf(o, "([^%c]+)", sep);
o+= strlen("([^*]+)");
2014-05-15 08:38:07 -04:00
}
s1 += s1_len;
strncat(o, s1, len - (s1 - str)); // string after slug
return out;
2014-05-15 08:38:07 -04:00
}
2014-05-14 22:08:42 -04:00
2014-05-15 00:53:48 -04:00
char * ltrim_slash(char* str)
{
char * p = str;
while (*p == '/') p++;
return zstrdup(p);
2014-05-15 00:53:48 -04:00
}
2014-05-15 06:02:10 -04:00
void print_indent(int level) {
int len = level * 2;
while(len--) {
printf(" ");
}
}
2014-05-16 12:35:56 -04:00
2014-06-18 08:47:06 -04:00
#ifndef HAVE_STRDUP
char *zstrdup(const char *s) {
2014-05-16 12:35:56 -04:00
char *out;
2014-05-16 15:17:51 -04:00
int count = 0;
2014-05-16 12:35:56 -04:00
while( s[count] )
++count;
++count;
out = zmalloc(sizeof(char) * count);
2014-05-16 12:35:56 -04:00
out[--count] = 0;
while( --count >= 0 )
out[count] = s[count];
return out;
}
#endif
2014-05-16 12:35:56 -04:00
2014-06-18 08:47:06 -04:00
#ifndef HAVE_STRNDUP
2014-05-21 04:36:50 -04:00
char *zstrndup(const char *s, int n) {
2014-05-16 12:35:56 -04:00
char *out;
2014-05-16 15:17:51 -04:00
int count = 0;
2014-05-16 12:35:56 -04:00
while( count < n && s[count] )
++count;
++count;
out = zmalloc(sizeof(char) * count);
2014-05-16 12:35:56 -04:00
out[--count] = 0;
while( --count >= 0 )
out[count] = s[count];
return out;
}
#endif