/**
* mds — A micro-display server
* Copyright © 2014 Mattias Andrée (maandree@member.fsf.org)
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
#include "raw-data.h"
#include "globals.h"
#include
#include
#include
#include
#include
#include
#include
#include
#include
/**
 * Put a `source_code_t` into its empty state
 *
 * All four buffer pointers are set to `NULL` and the line
 * count is set to zero; nothing is allocated or freed
 *
 * @param  this  The `source_code_t` to initialise
 */
void source_code_initialise(source_code_t* restrict this)
{
  /* No lines are stored yet. */
  this->line_count = 0;

  /* Clear the text buffers, then the line arrays, pairwise. */
  this->content = this->real_content = NULL;
  this->lines = this->real_lines = NULL;
}
/**
 * Release all data in a `source_code_t*`
 *
 * The structure itself is not freed. Afterwards every buffer
 * pointer is `NULL` and the line count is zero, so the structure
 * is in the same state as after `source_code_initialise` and
 * may be destroyed again or reused safely.
 *
 * @param  this  The `source_code_t*`
 */
void source_code_destroy(source_code_t* restrict this)
{
  free(this->lines), this->lines = NULL;
  free(this->real_lines), this->real_lines = NULL;
  free(this->content), this->content = NULL;
  free(this->real_content), this->real_content = NULL;
  /* Keep the count consistent with the (now absent) line arrays. */
  this->line_count = 0;
}
/**
 * Release all data in a `source_code_t*`, and free it
 *
 * Like `free`, this function accepts `NULL`, in which
 * case it does nothing.
 *
 * @param  this  The `source_code_t*`, may be `NULL`; the pointer
 *               must not be used after this call
 */
void source_code_free(source_code_t* restrict this)
{
  /* Nothing to release, and dereferencing `NULL` must be avoided. */
  if (this == NULL)
    return;

  free(this->lines);
  free(this->real_lines);
  free(this->content);
  free(this->real_content);
  free(this);
}
/**
 * Read the content of a file, ignoring interruptions
 *
 * The whole file is read into one heap buffer that grows as needed.
 * The buffer is not NUL-terminated. On failure an error message is
 * printed with `xperror` before returning.
 *
 * @param   pathname  The file to read
 * @param   size      Output parameter for the size of the read content, in char:s;
 *                    only written on success
 * @return            The read content, `NULL` on error; on success the caller
 *                    owns the buffer and releases it with `free`
 */
static char* read_file(const char* restrict pathname, size_t* restrict size)
{
  size_t buf_size = 8096;
  size_t buf_ptr = 0;
  char* restrict content = NULL;
  /* NOTE(review): `xxrealloc` is a project macro; `old` is assumed to hold
     the previous allocation when it fails, so that it can be freed at
     `pfail` -- confirm against the macro's definition. */
  char* restrict old = NULL;
  int fd = -1;
  ssize_t got;

  /* Allocate buffer for the file's content. */
  fail_if (xmalloc(content, buf_size, char));
  /* Open the file to compile. */
  fail_if ((fd = open(pathname, O_RDONLY)) < 0);

  /* Read the file to compile. */
  for (;;)
    {
      /* Make sure the buffer is not small. */
      if (buf_size - buf_ptr < 2048)
        {
          fail_if (xxrealloc(old, content, buf_size <<= 1, char));
        }
      /* Read a chunk of the file. */
      got = read(fd, content + buf_ptr, (buf_size - buf_ptr) * sizeof(char));
      /* An interrupted read is simply retried. */
      if ((got < 0) && (errno == EINTR)) continue;
      else if (got < 0) goto pfail;
      /* Zero bytes read means end of file. */
      else if (got == 0) break;
      buf_ptr += (size_t)got;
    }

  /* Shrink the buffer so it is not excessively large. An empty file
     keeps its initial allocation: a zero-sized reallocation may free
     the buffer and return `NULL`, which would be mistaken for an
     allocation failure. */
  if (buf_ptr > 0)
    {
      fail_if (xxrealloc(old, content, buf_ptr, char));
    }

  /* Close file descriptor for the file. */
  close(fd);

  *size = buf_ptr;
  return content;

 pfail:
  /* Report first, so that the cleanup below cannot disturb `errno`. */
  xperror(*argv);
  free(old);
  free(content);
  if (fd >= 0)
    close(fd);
  return NULL;
}
/**
 * Locate where a function call ends
 *
 * A function call is a non-empty name made up of ASCII letters and
 * underscores, directly followed by `(`, and it runs until the
 * matching `)`. Inside the call, `"`-quoted text hides brackets,
 * a backslash escapes the character after it, and a backslash may
 * also introduce a nested function call, which is skipped as a whole.
 *
 * @param   content  The code
 * @param   offset   The index of the first character after the backslash
 *                   that triggered this call
 * @param   size     The length of `content`
 * @return           The index of the character after the bracket that closes
 *                   the function call (may be outside the code by one character),
 *                   or `size` if the call does not end (that is, the code ends
 *                   prematurely), or zero if there is no function call at `offset`
 */
static __attribute__((pure)) size_t get_end_of_call(char* restrict content, size_t offset, size_t size)
{
  size_t pos = offset;
  size_t nested_end = 0;
  int escaped = 0;
  int quoted = 0;

  /* Step over the function name. */
  for (; pos < size; pos++)
    {
      char ch = content[pos];
      int lowercase = ('a' <= ch) && (ch <= 'z');
      int uppercase = ('A' <= ch) && (ch <= 'Z');
      if (!(lowercase || uppercase || (ch == '_')))
        break;
    }

  /* It is only a function call if a non-empty name
     is immediately followed by an opening bracket. */
  if (pos == size)
    return 0;
  if (pos == offset)
    return 0;
  if (content[pos] != '(')
    return 0;

  /* Walk through the call until its closing bracket. */
  while (pos < size)
    {
      char ch = content[pos];
      pos++;

      /* An escape may be longer than one character, but
         only its first character can affect the parsing. */
      if (escaped)
        {
          escaped = 0;
          continue;
        }

      /* Still inside a nested function call, which has
         already been parsed in full: nothing to inspect. */
      if (pos <= nested_end)
        continue;

      /* A backslash starts either an escape or a nested function call. */
      if (ch == '\\')
        {
          /* Treating it as an escape in either case is harmless: only
             one character is skipped, and no call is that short. */
          escaped = 1;
          /* Zero (no nested call) disables the skipping above. */
          nested_end = get_end_of_call(content, pos, size);
          continue;
        }

      /* Quoted text ends with the quote symbol,
         and brackets within it do not count. */
      if (quoted)
        {
          if (ch == '"')
            quoted = 0;
          continue;
        }

      /* The closing bracket ends the call. */
      if (ch == ')')
        break;

      /* " is the quote symbol. */
      if (ch == '"')
        quoted = 1;
    }

  return pos;
}
/**
 * Strip comments from the content, in place
 *
 * A comment starts with `#` and runs up to, but not including, the
 * next LF. A `#` is not a comment start when it is inside `"`-quoted
 * text, directly after a backslash, or inside a function call that
 * was introduced by a backslash. Kept characters are compacted
 * towards the beginning of `content`.
 *
 * @param   content  The code to shrink
 * @param   size     The size of `content`, in char:s
 * @return           The new size of `content`, in char:s; this function cannot fail
 */
static size_t remove_comments(char* restrict content, size_t size)
{
  size_t src = 0;
  size_t dst = 0;
  size_t nested_end = 0;
  int in_comment = 0;
  int quoted = 0;
  int escaped = 0;

  while (src < size)
    {
      char ch = content[src++];
      int keep = 1;

      if (in_comment)
        {
          /* Drop everything in the comment, but keep the LF that ends it. */
          if (ch == '\n')
            in_comment = 0;
          else
            keep = 0;
        }
      else if (escaped)
        {
          /* An escape may be longer than one character, but
             only its first character can affect the parsing. */
          escaped = 0;
        }
      else if (src <= nested_end)
        {
          /* Inside a function call, where nested quotes
             can appear: copy without interpretation. */
        }
      else if (ch == '\\')
        {
          /* A backslash starts either an escape or a function call.
             Treating it as an escape in either case is harmless: only
             one character is skipped, and no call is that short. */
          escaped = 1;
          /* Only characters from `src` and onwards are examined here,
             and those have not been overwritten by the compaction. */
          nested_end = get_end_of_call(content, src, size);
        }
      else if (quoted)
        {
          /* Quoted text ends with the quote symbol,
             and comments cannot start within it. */
          if (ch == '"')
            quoted = 0;
        }
      else if (ch == '#')
        {
          /* # is the comment symbol, it is dropped too. */
          in_comment = 1;
          keep = 0;
        }
      else if (ch == '"')
        {
          /* " is the quote symbol. */
          quoted = 1;
        }

      /* Anything else is code or whitespace, and is kept. */
      if (keep)
        content[dst++] = ch;
    }

  return dst;
}
/**
 * Build an array with a pointer to each line in a text
 *
 * @param   content  The text to split, it must end with an LF.
 *                   LF:s are treated as line endings rather than
 *                   new lines, this means that the final LF will
 *                   not create a new line in the returned array.
 *                   Each LF will be replaced by a NUL-character.
 * @param   length   The length of `content`.
 * @return           An array of each line in `content`. This
 *                   array will be `NULL`-terminated. Its elements
 *                   point into the allocation of `content`, which
 *                   means that each element must not be free:d,
 *                   rather you should simply free this returned
 *                   allocation and the allocation of `content`.
 *                   On error, `NULL` is returned, an error message
 *                   has been printed, and `content` will not have
 *                   been modified.
 */
static char** line_split(char* content, size_t length)
{
  char** restrict table = NULL;
  size_t line_total = 0;
  size_t next = 0;
  size_t pos;
  int at_line_start = 1;

  /* One line per LF. */
  pos = 0;
  while (pos < length)
    {
      line_total += (size_t)(content[pos] == '\n');
      pos++;
    }

  /* One extra slot for the `NULL` that terminates the array. */
  fail_if (xmalloc(table, line_total + 1, char*));
  table[line_total] = NULL;

  /* Record where each line begins, and terminate each line. */
  for (pos = 0; pos < length; pos++)
    {
      char* here = content + pos;

      if (at_line_start)
        {
          table[next] = here;
          next++;
          at_line_start = 0;
        }

      if (*here == '\n')
        {
          /* The character after an LF, if any, begins the next line. */
          *here = '\0';
          at_line_start = 1;
        }
    }

  return table;

 pfail:
  xperror(*argv);
  return NULL;
}
/**
 * Load a source file and split it into lines
 *
 * Two versions of the text are produced: one where comments have
 * been removed, and one that is left as read (apart from an LF
 * being appended if the file does not end with one). Both are
 * split into lines, and the texts, their line arrays and the
 * number of lines are stored in `source_code` on success.
 * On failure an error message is printed and `source_code`
 * is left untouched.
 *
 * @param   pathname     The pathname of the source file
 * @param   source_code  Output parameter for read data
 * @return               Zero on success, -1 on error
 */
int read_source_lines(const char* restrict pathname, source_code_t* restrict source_code)
{
  char* stripped = NULL;
  char* verbatim = NULL;
  char* previous = NULL;
  char** stripped_lines = NULL;
  char** verbatim_lines = NULL;
  size_t stripped_size;
  size_t verbatim_size;
  size_t count;

  /* Load the whole file. */
  stripped = read_file(pathname, &stripped_size);
  fail_if (stripped == NULL);

  /* The line splitter requires that the text ends with an LF. */
  if ((stripped_size == 0) || (stripped[stripped_size - 1] != '\n'))
    {
      fail_if (xxrealloc(previous, stripped, stripped_size + 1, char));
      stripped[stripped_size] = '\n';
      stripped_size++;
    }

  /* Keep a copy of the text as it was before simplification. */
  verbatim_size = stripped_size;
  fail_if (xmalloc(verbatim, verbatim_size, char));
  memcpy(verbatim, stripped, verbatim_size * sizeof(char));

  /* Simplify the text, and give back the memory this saves. */
  stripped_size = remove_comments(stripped, stripped_size);
  fail_if (xxrealloc(previous, stripped, stripped_size, char));

  /* Split both versions of the text into lines. */
  stripped_lines = line_split(stripped, stripped_size);
  fail_if (stripped_lines == NULL);
  verbatim_lines = line_split(verbatim, verbatim_size);
  fail_if (verbatim_lines == NULL);

  /* The line array is `NULL`-terminated: count up to the terminator. */
  for (count = 0; stripped_lines[count] != NULL; count++)
    ;

  /* Hand everything over to the caller. */
  source_code->line_count = count;
  source_code->content = stripped;
  source_code->real_content = verbatim;
  source_code->lines = stripped_lines;
  source_code->real_lines = verbatim_lines;
  return 0;

 pfail:
  xperror(*argv);
  free(previous);
  free(stripped);
  free(verbatim);
  free(stripped_lines);
  free(verbatim_lines);
  return -1;
}