proxy: begin transition from regex to parslib

This commit is contained in:
Kevin J. 2024-09-08 22:00:58 +02:00
parent 1bc58618e5
commit 718a040d15
6 changed files with 181 additions and 254 deletions

3
.gitmodules vendored Normal file
View File

@ -0,0 +1,3 @@
[submodule "parslib"]
path = parslib
url = http://git.0xdeadbeer.xyz/0xdeadbeer/parslib

View File

@ -1,14 +1,16 @@
CC=bear --append -- gcc CC=bear --append -- gcc
CFLAGS= -g3 -Wall -Werror CFLAGS= -g3 -Wall -Werror
CFILES=proxlib.c
CFILES_PARSLIB=parslib/parslib.final.o
OUT=proxlib
all: proxlib all: proxlib
proxy: proxlib.c proxlib: $(CFILES) $(CFILES_PARSLIB)
$(CC) $(CFLAGS) -o proxlib.o -c proxlib.c $(CC) $(CFLAGS) -o $(OUT) $^
$(CC) $(CFLAGS) -o proxlib proxlib.o
clean: clean:
rm -f proxlib *.o rm -f $(OUT)
tar: tar:
tar -cvzf proxlib.tgz proxlib.c proxlib.h README Makefile tar -cvzf proxlib.tgz $(CFILES) README Makefile

1
parslib Submodule

@ -0,0 +1 @@
Subproject commit 678a44228fe0c5b24b2d1b96576da0e44211c364

BIN
proxlib

Binary file not shown.

369
proxlib.c
View File

@ -7,194 +7,99 @@
#include <arpa/inet.h> #include <arpa/inet.h>
#include <netinet/in.h> #include <netinet/in.h>
#include <netdb.h> #include <netdb.h>
#include <regex.h>
#include "proxlib.h" #include "proxlib.h"
#include "parslib/parslib.h"
int on = 1; int on = 1;
int debug = 1; int debug = 2;
struct request *clt_data; struct request *clt_data;
regex_t preg;
regmatch_t pmatch[REGEX_MATCHN];
int statem; int statem;
int clt_sock = -1; int clt_sock = -1;
int srv_sock = -1; int srv_sock = -1;
char *clt_msg = NULL;
char *srv_msg = NULL;
int clt_msg_len = 0;
int srv_msg_len = 0;
void *extractsub(const char *msg, regmatch_t match) { #define SEGMENT_LEN 512
void *buf = NULL; #define MAX_BUFF_LEN 128 * 1024
int buflen = match.rm_eo - match.rm_so; int _read_line(int fd, char **outbuff) {
if (!buflen) char tmp_buff[SEGMENT_LEN];
goto _return; int tmp_buff_len = 0;
char *output_buff = NULL;
int output_buff_len = 0;
char *ptr = NULL;
int whead_pos = 0;
char *whead = NULL;
int diff = 0;
int ret = 0;
int end = 0;
buf = (void *) calloc(1, buflen); while (!end) {
if (buf == NULL) ret = recv(fd, tmp_buff, SEGMENT_LEN, MSG_PEEK);
goto _return; if (ret <= 0) {
break;
sprintf(buf, "%.*s", buflen, &msg[match.rm_so]);
_return:
return buf;
} }
int parse_header(char *msgbuff) { ptr = strstr(tmp_buff, "\r\n");
int ret; if (ptr >= tmp_buff+SEGMENT_LEN) {
diff = ret;
} else {
diff = ptr - tmp_buff + 2;
end = 1;
}
ret = regcomp(&preg, REGEX_HEADER, REG_EXTENDED); tmp_buff_len = diff;
if (ret != 0) whead_pos = output_buff_len;
goto _err; output_buff_len += tmp_buff_len;
ret = regexec(&preg, msgbuff, REGEX_MATCHN, pmatch, 0); if (tmp_buff_len > MAX_BUFF_LEN) {
if (ret != 0)
goto _ok;
char *key = extractsub(msgbuff, pmatch[1]);
if (key == NULL)
goto _err;
char *value = extractsub(msgbuff, pmatch[2]);
if (value == NULL)
goto _err;
struct header new_header = {
.key = key,
.value = value
};
int last_index = clt_data->header_num;
clt_data->header_num++;
clt_data->headers = (void *) realloc(clt_data->headers,
clt_data->header_num*sizeof(struct header));
clt_data->headers[last_index] = new_header;
_ok:
regfree(&preg);
return 0;
_err:
regfree(&preg);
return -1; return -1;
} }
int parse_host(char *buff) { output_buff = (char *) realloc(output_buff, output_buff_len);
int ret; if (!output_buff) {
ret = regcomp(&preg, REGEX_HOST, REG_EXTENDED);
if (ret != 0)
goto _err;
ret = regexec(&preg, buff, REGEX_MATCHN, pmatch, 0);
if (ret != 0)
goto _err;
char *host_name = extractsub(buff, pmatch[1]);
if (!host_name)
goto _err;
char *host_port = extractsub(buff, pmatch[2]);
if (!host_port) {
host_port = PROXY_DEF_PORT;
}
clt_data->host_name = host_name;
clt_data->host_port = host_port;
regfree(&preg);
return 0;
_err:
regfree(&preg);
return -1; return -1;
} }
int parse_title(char *msgbuff) { whead = output_buff+whead_pos;
int ret; ret = recv(fd, whead, diff, 0);
if (ret <= 0) {
break;
}
}
ret = regcomp(&preg, REGEX_TITLE, REG_EXTENDED); *outbuff = output_buff;
if (ret != 0) return output_buff_len;
goto _err; }
ret = regexec(&preg, msgbuff, REGEX_MATCHN, pmatch, 0); /* easy wrapper for _read_line(int fd, void **outbuff) */
if (ret != 0) int read_line(int fd,
goto _err; int *line_len, char **line,
int *msgbuff_len, char **msgbuff) {
int ret = 0;
clt_data->method = extractsub(msgbuff, pmatch[1]); ret = *line_len = _read_line(fd, line);
if (clt_data->method == NULL) if (ret < 0) {
goto _err;
clt_data->uri = extractsub(msgbuff, pmatch[2]);
if (clt_data->uri == NULL)
goto _err;
clt_data->ver = extractsub(msgbuff, pmatch[3]);
if (clt_data->ver == NULL)
goto _err;
regfree(&preg);
return 0;
_err:
regfree(&preg);
return -1; return -1;
} }
void free_host(void) { *msgbuff = (char *) realloc(*msgbuff, *msgbuff_len+*line_len);
free(clt_data->host_name); if (!*msgbuff) {
free(clt_data->host_port); free(*line);
return -1;
} }
void free_title(void) { memcpy(*msgbuff+*msgbuff_len, *line, *line_len);
free(clt_data->method);
free(clt_data->uri);
free(clt_data->ver);
}
void free_headers(void) { *msgbuff_len += *line_len;
for (int i = 0; i < clt_data->header_num; i++) { ((char *) *line)[(*line_len)-2] = '\0';
struct header *header = &clt_data->headers[i]; *line_len -= 2;
free(header->key);
free(header->value);
}
free(clt_data->headers);
}
void free_clt_data(void) { return 0;
free_host();
free_title();
free_headers();
free(clt_data);
}
void free_srv_data(void) {
}
void free_msg_buffs(void) {
free(clt_msg);
free(srv_msg);
}
void free_data(void) {
free_clt_data();
free_srv_data();
} }
int parse_line(char *line, int line_count) { int parse_line(char *line, int line_count) {
int ret = 0; int ret = 0;
if (line_count == 0) {
ret = parse_title(line);
} else {
ret = parse_header(line);
}
return ret; return ret;
} }
@ -218,7 +123,7 @@ void do_err(void) {
} }
int do_fwd_clt(void) { int do_fwd_clt(void) {
int bytes = 0; /*int bytes = 0;
int ret = 0; int ret = 0;
while (bytes < srv_msg_len) { while (bytes < srv_msg_len) {
ret = write(clt_sock, srv_msg+bytes, srv_msg_len-bytes); ret = write(clt_sock, srv_msg+bytes, srv_msg_len-bytes);
@ -226,7 +131,7 @@ int do_fwd_clt(void) {
return -1; return -1;
bytes += ret; bytes += ret;
} }*/
return 0; return 0;
} }
@ -238,7 +143,7 @@ int do_prs_srv(void) {
} }
int do_rcv_srv(void) { int do_rcv_srv(void) {
int bytes = 0; /*int bytes = 0;
int ret = 0; int ret = 0;
while (bytes < PROXY_MAX_MSGLEN) { while (bytes < PROXY_MAX_MSGLEN) {
ret = recv(srv_sock, srv_msg+bytes, PROXY_MAX_MSGLEN-bytes, MSG_PEEK); ret = recv(srv_sock, srv_msg+bytes, PROXY_MAX_MSGLEN-bytes, MSG_PEEK);
@ -253,21 +158,18 @@ int do_rcv_srv(void) {
srv_msg_len = bytes; srv_msg_len = bytes;
if (debug) if (debug == 1)
fprintf(stdout, "[%d] Received server message of size %d bytes\n", statem, srv_msg_len); fprintf(stdout, "[%d] Received server message of size %d bytes\n", statem, srv_msg_len);
*/
return 0; return 0;
} }
// TODO
int do_con_srv(void) { int do_con_srv(void) {
int ret; int ret;
char *host = getheader("Host");
if (!host)
return -1;
ret = parse_host(host); // MISSING HOST
if (ret < 0)
return -1;
struct addrinfo hints; struct addrinfo hints;
struct addrinfo *res; struct addrinfo *res;
@ -293,7 +195,7 @@ int do_con_srv(void) {
} }
int do_fwd_srv(void) { int do_fwd_srv(void) {
int bytes = 0; /*int bytes = 0;
int ret = 0; int ret = 0;
while (bytes < clt_msg_len) { while (bytes < clt_msg_len) {
ret = write(srv_sock, clt_msg+bytes, clt_msg_len-bytes); ret = write(srv_sock, clt_msg+bytes, clt_msg_len-bytes);
@ -301,96 +203,101 @@ int do_fwd_srv(void) {
return -1; return -1;
bytes += ret; bytes += ret;
} }*/
return 0; return 0;
} }
int do_prs_clt(void) { int do_rcv_clt(struct conn *conn) {
int ret;
int ln_cnt = 0;
char *ln = strdup(clt_msg);
if (!ln)
return -1;
ln = strtok(ln, "\n");
while (ln) {
ret = parse_line(ln, ln_cnt);
if (ret < 0)
return -1;
ln_cnt++;
ln = strtok(NULL, "\n");
}
return 0;
}
int do_rcv_clt(void) {
int bytes = 0;
int ret = 0; int ret = 0;
while (bytes < PROXY_MAX_MSGLEN) { char *line = NULL;
ret = recv(clt_sock, clt_msg+bytes, PROXY_MAX_MSGLEN-bytes, MSG_PEEK); char *msgbuff = NULL;
if (ret < 0) int line_len = 0;
int msgbuff_len = 0;
// request line
ret = read_line(conn->cltfd, &line_len, &line, &msgbuff_len, &msgbuff);
if (ret < 0) {
fprintf(stderr, "Failed receiving request line\n");
return -1; return -1;
if (!ret)
break;
ret = recv(clt_sock, clt_msg+bytes, PROXY_MAX_MSGLEN-bytes, 0);
bytes += ret;
} }
clt_msg_len = bytes; if (debug == 1) {
fprintf(stdout, "debug - received line: %s\n", line);
if (debug)
fprintf(stdout, "[%d] Received client message of size %d bytes\n", statem, clt_msg_len);
return 0;
} }
int do_alloc(void) { ret = pareqtitl(line, line_len, &(conn->cltreq.titl));
clt_msg = (char *) calloc(1, PROXY_MAX_MSGLEN); if (ret < 0) {
if (!clt_msg) fprintf(stderr, "Failed parsing request line\n");
return -1; return -1;
}
srv_msg = (char *) calloc(1, PROXY_MAX_MSGLEN); if (debug == 1) {
if (!srv_msg) fprintf(stdout, "debug - parsed request line\n");
return -1; }
clt_data = (struct request *) calloc(1, sizeof(struct request)); free(line);
if (!clt_data)
// headers
int next_header = 1;
while (next_header) {
ret = read_line(conn->cltfd, &line_len, &line, &msgbuff_len, &msgbuff);
if (ret < 0) {
fprintf(stderr, "Failed receiving header line\n");
return -1; return -1;
}
if (line_len == 0) {
if (debug == 1) {
fprintf(stdout, "debug - reached end of headers\n");
}
next_header = 0;
continue;
}
if (debug == 1) {
fprintf(stdout, "debug - received line: %s\n", line);
}
ret = parshfield(line, line_len, conn->cltreq.hentries);
if (ret < 0) {
fprintf(stderr, "Failed parsing header field\n");
return -1;
}
if (debug == 1) {
fprintf(stdout, "debug - parsed header field\n");
}
free(line);
}
if (debug <= 2) {
fprintf(stdout, "printing parsed request\n");
printfpareq(&conn->cltreq);
}
return 0; return 0;
} }
void do_clear(void) { void do_clear(void) {
statem = STATEM_RCV_CLT; statem = STATEM_RCV_CLT;
memset(clt_msg, 0, PROXY_MAX_MSGLEN);
memset(srv_msg, 0, PROXY_MAX_MSGLEN);
memset(clt_data, 0, sizeof(struct request));
clt_msg_len = 0;
srv_msg_len = 0;
} }
void do_statem() { void do_statem() {
int ret = do_alloc(); int ret = 0;
if (ret < 0) { struct conn *conn = (struct conn *) calloc(1, sizeof(struct conn));
do_err(); if (!conn) {
fprintf(stderr, "Not enough dynamic memory to establish connection\n");
return; return;
} }
conn->cltfd = clt_sock;
for (int counter = 0; counter < MAX_BOUND; counter++) { for (int counter = 0; counter < MAX_BOUND; counter++) {
switch (statem & (~STATEM_ERR)) { switch (statem & (~STATEM_ERR)) {
case STATEM_RCV_CLT: case STATEM_RCV_CLT:
ret = do_rcv_clt(); ret = do_rcv_clt(conn);
break;
case STATEM_PRS_CLT:
ret = do_prs_clt();
break; break;
case STATEM_CON_SRV: case STATEM_CON_SRV:
ret = do_con_srv(); ret = do_con_srv();
@ -401,9 +308,6 @@ void do_statem() {
case STATEM_RCV_SRV: case STATEM_RCV_SRV:
ret = do_rcv_srv(); ret = do_rcv_srv();
break; break;
case STATEM_PRS_SRV:
ret = do_prs_srv();
break;
case STATEM_FWD_CLT: case STATEM_FWD_CLT:
ret = do_fwd_clt(); ret = do_fwd_clt();
break; break;
@ -428,8 +332,7 @@ void do_statem() {
statem <<= 1; statem <<= 1;
} }
free_msg_buffs(); free(conn);
free_data();
} }
void dohelp() { void dohelp() {
@ -566,6 +469,12 @@ int main(int argc, char *argv[]) {
return 0; return 0;
} }
ret = initres();
if (ret < 0) {
fprintf(stderr, "Failed generating trees\n");
return -1;
}
const char *mode = argv[1]; const char *mode = argv[1];
ret = strcmp(mode, SERVER_MODE); ret = strcmp(mode, SERVER_MODE);
if (ret == 0) if (ret == 0)
@ -576,4 +485,6 @@ int main(int argc, char *argv[]) {
return do_clt(); return do_clt();
fprintf(stderr, "Unknown proxy mode\n"); fprintf(stderr, "Unknown proxy mode\n");
fretres();
} }

View File

@ -1,7 +1,11 @@
#ifndef STRUCTS_H #ifndef STRUCTS_H
#define STRUCTS_H #define STRUCTS_H
#include "parslib/parslib.h"
#ifndef MAX_BOUND
#define MAX_BOUND 10000 #define MAX_BOUND 10000
#endif
#define SERVER_MODE "server" #define SERVER_MODE "server"
#define CLIENT_MODE "client" #define CLIENT_MODE "client"
@ -22,13 +26,11 @@
"Host: archive.0xdeadbeer.org\r\n"\ "Host: archive.0xdeadbeer.org\r\n"\
#define STATEM_RCV_CLT 0b00000001 #define STATEM_RCV_CLT 0b00000001
#define STATEM_PRS_CLT 0b00000010 #define STATEM_CON_SRV 0b00000010
#define STATEM_CON_SRV 0b00000100 #define STATEM_FWD_SRV 0b00000100
#define STATEM_FWD_SRV 0b00001000 #define STATEM_RCV_SRV 0b00001000
#define STATEM_RCV_SRV 0b00010000 #define STATEM_FWD_CLT 0b00010000
#define STATEM_PRS_SRV 0b00100000 #define STATEM_ERR 0b00100000
#define STATEM_FWD_CLT 0b01000000
#define STATEM_ERR 0b10000000
struct header { struct header {
char *key; char *key;
@ -46,4 +48,12 @@ struct request {
struct header *headers; struct header *headers;
}; };
struct conn {
int cltfd;
int srvfd;
struct httpareq cltreq;
struct httpares srvres;
};
#endif #endif