/*
arfnet2-search: Fast file indexer and search
Copyright (C) 2023 arf20 (Ángel Ruiz Fernandez)
This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program. If not, see <https://www.gnu.org/licenses/>.
index.c: Efficient fast file index
*/
#include "index.h"
#include <dirent.h>
#include <errno.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <sys/stat.h>
#include <magic.h>
#include "config.h"
/*
 * Closed-addressing (separate chaining) hash map.
 * The bucket array holds the head node of every chain inline; colliding
 * entries are linked behind the head through node_s.next.
 */
typedef struct map_s {
    struct node_s *map; /* bucket array with `size` elements */
    size_t count;       /* number of entries inserted so far */
    size_t size;        /* number of buckets in `map` */
} map_t;
/*
 * One node of a bucket chain. The head node of each bucket is stored
 * inline in map_t.map; map_insert() allocates further nodes and links
 * them through `next`.
 */
struct node_s {
/* entry payload; NULL in a bucket head marks the bucket as empty */
node_data_t *data;
/* next node in the same bucket, NULL at the end of the chain */
struct node_s *next;
/* map passed to map_insert() together with `data`; presumably the index of
   a subdirectory's contents, NULL otherwise - TODO confirm against callers */
map_t *child;
};
/* libmagic handle: opened by index_init(), closed by index_deinit() and
   handed to magic_file() by index_new() when files are examined */
static magic_t magic_cookie = NULL;
/*
 * Multiplicative (x31) string hash reduced to the range [0, mod).
 *
 * s:   NUL-terminated key; NULL hashes to 0.
 * mod: number of buckets. A value <= 0 cannot be used as a modulus
 *      (0 would divide by zero, a negative value would convert to a huge
 *      unsigned modulus), so 0 is returned in that case.
 *
 * Bytes are read as unsigned char so the result does not depend on
 * whether plain char is signed on the target platform.
 */
size_t
hash(const char *s, int mod)
{
    size_t h = 0;

    if (!s || mod <= 0)
        return 0;

    for (const unsigned char *p = (const unsigned char *)s; *p; p++)
        h = h * 31 + *p;

    return h % (size_t)mod;
}
/*
 * Allocate an empty map with `size` buckets.
 *
 * A request for 0 buckets is rounded up to 1, because a table without
 * buckets cannot be indexed (the bucket count is used as hash modulus).
 *
 * Returns the new map, or NULL if memory could not be allocated.
 */
map_t *
map_new(size_t size)
{
    if (size == 0)
        size = 1;

    map_t *map = malloc(sizeof(*map));
    if (!map)
        return NULL;

    /* calloc zeroes every bucket head and checks size * sizeof for overflow */
    map->map = calloc(size, sizeof(*map->map));
    if (!map->map) {
        free(map);
        return NULL;
    }

    map->size = size;
    map->count = 0;
    return map;
}
/*
 * Insert an entry into `map`.
 *
 * key:   string that selects the bucket (it is hashed, not stored).
 * data:  entry payload. Must not be NULL: a NULL payload in a bucket head
 *        is what marks the bucket as empty, so such an insert is ignored.
 * child: map stored alongside the payload, may be NULL.
 *
 * The first entry of a bucket is stored in the inline head node; later
 * entries are appended to the end of the bucket's chain. If a chain node
 * cannot be allocated the entry is dropped and an error is logged; since
 * the function returns void the caller is not otherwise notified.
 */
void
map_insert(map_t *map, const char *key, node_data_t *data, map_t *child)
{
    if (!map || !map->map || map->size == 0 || !data)
        return;

    struct node_s *node = &map->map[hash(key, map->size)];

    if (node->data) {
        /* allocate before touching the chain so a failure leaves it intact */
        struct node_s *fresh = malloc(sizeof(*fresh));
        if (!fresh) {
            fprintf(stderr, "[index] error malloc(): %s\n", strerror(errno));
            return;
        }
        fresh->data = data;
        fresh->child = child;
        fresh->next = NULL;

        while (node->next)
            node = node->next;
        node->next = fresh;
    } else {
        node->data = data;
        node->child = child;
    }

    map->count++;
}
/*
 * Allocate an empty result vector with room for INIT_VEC_CAPACITY
 * entries.
 *
 * Returns the new vector, or NULL if memory could not be allocated.
 */
results_t *
results_new(void)
{
    results_t *r = malloc(sizeof(*r));
    if (!r)
        return NULL;

    r->capacity = INIT_VEC_CAPACITY;
    r->size = 0;

    /* calloc hands back zeroed slots, matching the former malloc + memset */
    r->results = calloc(r->capacity, sizeof(node_data_t *));
    if (!r->results) {
        free(r);
        return NULL;
    }

    return r;
}
/*
 * Append `result` to the result vector, doubling its storage when it is
 * about to fill up.
 *
 * The vector stores the pointer only; it does not copy the entry.
 * If the storage cannot be grown the old storage is kept untouched, the
 * result is dropped and an error is logged.
 */
void
results_insert(results_t *results, const node_data_t *result)
{
    if (!results)
        return;

    if (results->size + 1 >= results->capacity) {
        /* a capacity of 0 would stay 0 when doubled, so start from 2 */
        size_t new_capacity = results->capacity ? results->capacity * 2 : 2;

        /* keep the old pointer until realloc is known to have succeeded */
        void *grown = realloc(results->results,
            sizeof(node_data_t *) * new_capacity);
        if (!grown) {
            fprintf(stderr, "[index] error realloc(): %s\n", strerror(errno));
            return;
        }

        results->results = grown;
        results->capacity = new_capacity;
    }

    results->results[results->size++] = result;
}
/*
 * Open the libmagic handle used to detect MIME types and load the
 * default magic database.
 *
 * Returns 0 on success, -1 on failure. On failure no handle is left
 * open: a handle whose database failed to load is closed again and the
 * module-level cookie is reset to NULL.
 */
int
index_init(void)
{
    magic_cookie = magic_open(MAGIC_MIME);
    if (!magic_cookie) {
        fprintf(stderr, "[index] error magic_open()\n");
        return -1;
    }

    if (magic_load(magic_cookie, NULL) < 0) {
        fprintf(stderr, "[index] error magic_load(): %s\n",
            magic_error(magic_cookie));
        /* do not leak the half-initialised handle */
        magic_close(magic_cookie);
        magic_cookie = NULL;
        return -1;
    }

    return 0;
}
/*
 * Close the libmagic handle opened by index_init().
 *
 * The cookie is reset to NULL afterwards, so calling this function again
 * (or without a successful index_init()) is a harmless no-op instead of
 * a double close.
 */
void
index_deinit(void)
{
    if (magic_cookie) {
        magic_close(magic_cookie);
        magic_cookie = NULL;
    }
}
/*
 * Build an index of directory `dir`, recursing into subdirectories.
 *
 * icapacity: bucket count used for the map of every directory level.
 * dir:       path of the directory to scan.
 * examine:   when non-zero, each entry's MIME description is obtained
 *            with magic_file() and stored in the entry's `mime` field.
 *
 * Every entry except "." and ".." gets a heap-allocated node_data_t with
 * a strdup'd name and its stat() result. Entries that cannot be stat'ed,
 * whose path does not fit the path buffer, or for which memory runs out
 * are logged (where applicable) and skipped. Directories (d_type ==
 * DT_DIR) are indexed recursively and the resulting map is attached to
 * the entry as its child; a failed recursion leaves the child NULL.
 *
 * Returns the new map, or NULL if the directory cannot be opened or the
 * map cannot be allocated. All allocations are owned by the returned
 * index.
 */
map_t *
index_new(size_t icapacity, const char *dir, int examine)
{
    DIR *dirp = opendir(dir);
    if (!dirp) {
        fprintf(stderr, "[index] error opening directory %s: %s\n", dir,
            strerror(errno));
        return NULL;
    }

    map_t *map = map_new(icapacity);
    if (!map) {
        closedir(dirp);
        return NULL;
    }

    char path[4096];
    struct dirent *de = NULL;
    while ((de = readdir(dirp))) {
        if (strcmp(de->d_name, ".") == 0 || strcmp(de->d_name, "..") == 0)
            continue;

        int len = snprintf(path, sizeof(path), "%s/%s", dir, de->d_name);
        if (len < 0 || (size_t)len >= sizeof(path)) {
            fprintf(stderr, "[index] error path too long: %s/%s\n", dir,
                de->d_name);
            continue;
        }

        /* zeroed, so fields that are not filled in below (e.g. mime when
           examine is off) are NULL/0 rather than indeterminate */
        node_data_t *data = calloc(1, sizeof(*data));
        char *name = strdup(de->d_name);
        if (!data || !name) {
            fprintf(stderr, "[index] error allocating entry %s: %s\n", path,
                strerror(errno));
            free(name);
            free(data);
            continue;
        }
        data->name = name;

        /* stat it */
        if (stat(path, &data->stat) < 0) {
            fprintf(stderr, "[index] error stat() %s: %s\n", path,
                strerror(errno));
            free(name);
            free(data);
            continue;
        }

        /* examine */
        if (examine) {
            const char *desc = magic_file(magic_cookie, path);
            if (!desc)
                fprintf(stderr, "[index] error magic_file() %s: %s\n", path,
                    magic_error(magic_cookie));
            else
                /* libmagic reuses its result buffer on the next call, so
                   keep a private copy (stays NULL if strdup fails) */
                data->mime = strdup(desc);
        }

        /* recurse */
        map_t *child = NULL;
        if (de->d_type == DT_DIR)
            child = index_new(icapacity, path, examine);

        map_insert(map, de->d_name, data, child);
    }

    closedir(dirp);
    return map;
}
/*
 * Collect every entry whose name contains `query` as a substring.
 *
 * index:   map to search; child maps attached to its entries are
 *          searched recursively.
 * query:   substring to look for (an empty string matches every name).
 * results: vector that receives a pointer to each matching entry.
 *
 * Returns 0 on success, -1 if any argument is NULL.
 */
int
index_lookup_substr(map_t *index, const char *query,
    results_t *results)
{
    if (!index || !query || !results)
        return -1;

    for (size_t i = 0; i < index->size; i++) {
        /* a bucket head without data means the bucket is empty */
        if (!index->map[i].data)
            continue;

        /* walk the whole chain, including its last node */
        for (struct node_s *node = &index->map[i]; node; node = node->next) {
            if (node->data && node->data->name
                && strstr(node->data->name, query))
                results_insert(results, node->data);

            if (node->child)
                index_lookup_substr(node->child, query, results);
        }
    }

    return 0;
}
/*
 * Search `index` for `query` using the matching strategy `type`.
 *
 * Returns a newly allocated result vector holding pointers to the
 * matching entries. The vector is empty when nothing matches, when
 * `index` or `query` is NULL, or when `type` is not a known lookup
 * type. Returns NULL only if the vector itself could not be created.
 */
results_t *
index_lookup(map_t *index, lookup_type_t type, const char *query)
{
    results_t *results = results_new();
    if (!results)
        return NULL;

    if (!index || !query)
        return results;

    switch (type) {
    case LOOKUP_SUBSTR:
        /* matches are accumulated in `results`; the status is not needed */
        (void)index_lookup_substr(index, query, results);
        break;
    default:
        break;
    }

    return results;
}
/*
 * Release an index.
 * NOTE(review): the body is empty, so this function currently frees
 * nothing; the maps, chain nodes and entry data allocated while building
 * an index are not released here. TODO implement.
 */
void
index_destroy(index_t index)
{
}