summaryrefslogtreecommitdiff
path: root/deps/drassil/mysql-tools/dump-parser.c
blob: a9262d4f9205425b15d4e17db2fe0090a6d04650 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
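/* Build: gcc -O2 -Wall -pedantic dump-parser.c -o dump-parser
 Usage: cat dump.sql | dump-parser
   Or : dump-parser dump.sql
 Known bugs:
 * The parser will fail if the 10001st character of a line is an escaped quote; it will see it as an unescaped quote.
   (NOTE: input is read in chunks of BUFFER - 1 characters, so the affected position is presumably the
   chunk boundary rather than literally the 10001st character -- to be confirmed.)
*/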
 
#include <stdio.h>
#include <stdlib.h>
#include <stdbool.h>
#include <string.h>
 
#define BUFFER 100000
 
/*
 * Tell whether the character at string[offset] is escaped, i.e. whether it
 * is preceded by an odd number of consecutive backslashes.
 *
 * string: buffer to inspect; indices below offset are read.
 * offset: index of the character being tested.
 *
 * Returns true when the run of backslashes ending at string[offset - 1] has
 * odd length, false otherwise (including when offset is 0).
 */
bool is_escaped(char* string, int offset) {
    bool escaped = false;

    /* Walk backwards over the backslash run, flipping parity at each one. */
    while (offset != 0 && string[offset - 1] == '\\') {
        escaped = !escaped;
        offset--;
    }

    return escaped;
}
 
/*
 * Tell whether a string opens with the three-character marker "-- "
 * (dash, dash, space).
 *
 * string: NUL-terminated text to test; only its first three characters matter.
 *
 * Returns true when the string begins with "-- ", false otherwise (including
 * for strings shorter than three characters).
 */
bool is_commented(char* string) {
    static const char marker[] = "-- ";

    /* sizeof includes the terminating NUL, so compare one byte fewer. */
    return strncmp(string, marker, sizeof marker - 1) == 0;
}
 
/*
 * Copy a SQL dump to stdout, inserting a newline before every opening
 * parenthesis that is found at nesting depth 0 outside a quoted string.
 *
 * Input is read from the file named by argv[1] when given, otherwise from
 * stdin.  Lines starting with "-- " are copied through untouched.  Input is
 * consumed in chunks of at most BUFFER - 1 characters; the quote, escape,
 * nesting and comment state is carried from one chunk to the next.
 *
 * Returns 0 on success, EXIT_FAILURE when the input file cannot be opened or
 * read.  Exits with status 1 when a closing parenthesis is met without a
 * matching opening one.
 */
int main(int argc, char *argv[])
{
    FILE* file = stdin;
    char buffer[BUFFER];
    char* line;
    size_t pos;
    size_t length;
    int parenthesis = 0;
    int status = 0;
    bool quote = false;
    bool escape = false;
    bool comment = false;
    bool line_start = true;
    bool ends_line;

    if (argc > 1) {
        file = fopen(argv[1], "r");
        if (file == NULL) {
            perror(argv[1]);
            return EXIT_FAILURE;
        }
    }

    while (fgets(buffer, BUFFER, file) != NULL) {
        /* A chunk without a trailing newline means the line continues in the
           next chunk (or the input ended without a final newline). */
        length = strlen(buffer);
        ends_line = length > 0 && buffer[length - 1] == '\n';

        /* Only test for the comment marker at the real start of a line; a
           continuation chunk keeps the state of the chunk before it. */
        if (line_start) {
            comment = is_commented(buffer);
        }

        if (comment) {
            /* skip commented */
            fputs(buffer, stdout);
        } else {
            line = buffer;

            while (*line != '\0') {
                /* if we are still in escape state, we need to check first char. */
                pos = 0;
                if (!escape) {
                    /* find any character in ()'\ */
                    pos = strcspn(line, "()'\\");
                }

                if (pos > 0) {
                    /* print before match */
                    fwrite(line, 1, pos, stdout);
                }

                if (line[pos] == '\0') {
                    /* no more special characters in this chunk */
                    break;
                }

                switch (line[pos]) {
                    case '(':
                        if (!quote) {
                            if (parenthesis == 0) {
                                putchar('\n');
                            }
                            parenthesis++;
                        }
                        escape = false;
                        break;

                    case ')':
                        if (!quote) {
                            if (parenthesis > 0) {
                                parenthesis--;
                            } else {
                                /* whoops */
                                puts("\n");
                                fputs(line, stdout);
                                fputs("Found closing parenthesis without opening one.\n", stderr);
                                exit(1);
                            }
                        }
                        escape = false;
                        break;

                    case '\\':
                        /* a backslash escapes the next char unless it is itself escaped */
                        escape = !escape;
                        break;

                    case '\'':
                        if (escape) {
                            escape = false;
                        } else {
                            quote = !quote;
                        }
                        break;

                    default:
                        /* any other character consumes a pending escape */
                        escape = false;
                        break;
                }

                /* print char then skip it (to make sure we don't double match) */
                putchar(line[pos]);
                line += pos + 1;
            }
        }

        line_start = ends_line;
    }

    if (ferror(file)) {
        perror("read error");
        status = EXIT_FAILURE;
    }

    if (file != stdin) {
        fclose(file);
    }

    return status;
}