WebSurf/content/textsearch.c

629 lines
14 KiB
C
Raw Normal View History

/*
* Copyright 2004 John M Bell <jmb202@ecs.soton.ac.uk>
* Copyright 2005 Adrian Lees <adrianl@users.sourceforge.net>
* Copyright 2009 Mark Benjamin <netsurf-browser.org.MarkBenjamin@dfgh.net>
*
* This file is part of NetSurf, http://www.netsurf-browser.org/
*
* NetSurf is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; version 2 of the License.
*
* NetSurf is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*/
/**
* \file
* Free text search
*/
#include <stdbool.h>
#include "utils/errors.h"
#include "utils/utils.h"
#include "netsurf/types.h"
2016-05-30 02:57:22 -07:00
#include "netsurf/search.h"
#include "desktop/selection.h"
#include "desktop/gui_internal.h"
#include "content/content.h"
#include "content/content_protected.h"
#include "content/hlcache.h"
#include "content/textsearch.h"
/**
 * One search match, kept as a node of a doubly-linked list.
 *
 * The list is anchored by a sentinel entry stored in
 * textsearch_context::found. The sentinel's next member points at the
 * first match and its prev member at the most recently appended match.
 */
struct list_entry {
unsigned start_idx; /* start position of match */
unsigned end_idx; /* end of match */
struct box *start_box; /* used only for html contents */
struct box *end_box; /* box in which the match ends (see start_box) */
struct selection *sel; /* highlight for this match, NULL when not highlighted */
struct list_entry *prev; /* previous match, NULL for the first match */
struct list_entry *next; /* next match, NULL for the last match */
};
/**
 * The context for a free text search
 */
struct textsearch_context {
	/** opaque pointer passed back to every GUI search callback */
	void *gui_p;
	/** content being searched */
	struct content *c;
	/** sentinel head of the list of matches */
	struct list_entry *found;
	/** current match; first for select all */
	struct list_entry *current;
	/** private copy of the search string, may be NULL */
	char *string;
	/** case sensitivity used by the previous search */
	bool prev_case_sens;
	/** true until a search has completed on this context */
	bool newsearch;
};
/**
 * Free every match held by a search context.
 *
 * Any selection object attached to a match is cleared and destroyed too.
 * The sentinel head of the list is kept and left empty.
 *
 * \param textsearch The search context whose matches are released.
 */
static void free_matches(struct textsearch_context *textsearch)
{
	struct list_entry *head = textsearch->found;
	struct list_entry *entry = head->next;

	/*
	 * Detach the chain from the head before touching the selections:
	 * clearing one may update the toolkit immediately, which can cause
	 * nested accesses to the list.
	 */
	head->prev = NULL;
	head->next = NULL;

	while (entry != NULL) {
		struct list_entry *following = entry->next;

		if (entry->sel != NULL) {
			selection_clear(entry->sel, true);
			selection_destroy(entry->sel);
		}
		free(entry);

		entry = following;
	}
}
/* Exported function documented in content/textsearch.h */
/*
 * Implementation notes:
 *
 * - '*' in the pattern matches any run of characters (including none) and
 *   '#' matches exactly one arbitrary character.
 * - The pattern is treated as if it were preceded by a '*', so the match
 *   may start anywhere in the string.
 * - On success the start of the match is returned and *m_len receives its
 *   length (never less than 1); NULL is returned when nothing matches.
 * - Characters are converted to unsigned char before being handed to
 *   toupper(); passing a negative char value is undefined behaviour.
 */
const char *
content_textsearch_find_pattern(const char *string,
		int s_len,
		const char *pattern,
		int p_len,
		bool case_sens,
		unsigned int *m_len)
{
	/* backtracking stack: one entry per wildcard that may be retried */
	struct { const char *ss, *s, *p; bool first; } context[16];
	const int context_max = (int)(sizeof(context) / sizeof(context[0]));
	const char *ep = pattern + p_len;
	const char *es = string + s_len;
	const char *p = pattern;
	const char *ss = string;
	const char *s = string;
	/* true when a wildcard is pending in front of *p; starts true to
	 * model the virtual '*' before the pattern without ever forming a
	 * pointer to pattern[-1] */
	bool wild = true;
	bool first = true;
	int top = 0;

	while (wild || p < ep) {
		bool matches;

		if (wild || *p == '*') {
			int ch;

			/* a real asterisk still has to be stepped over; a
			 * pending wildcard is already positioned after it */
			if (!wild) {
				p++;
			}
			wild = false;

			/* skip any further asterisks; one is the same as many
			 */
			while (p < ep && *p == '*') {
				p++;
			}

			/* if we're at the end of the pattern, yes, it matches
			 */
			if (p >= ep) {
				break;
			}

			/* anything matches a # so continue matching from
			 * here, and stack a context that will try to match
			 * the wildcard against the next character */
			ch = (unsigned char)*p;
			if (ch != '#') {
				/* scan forwards until we find a match for
				 * this char */
				if (!case_sens) {
					ch = toupper(ch);
				}
				while (s < es) {
					int sc = (unsigned char)*s;

					if (!case_sens) {
						sc = toupper(sc);
					}
					if (sc == ch) {
						break;
					}
					s++;
				}
			}

			if (s < es) {
				/* remember where we are in case the match
				 * fails; we may then resume */
				if (top < context_max) {
					context[top].ss = ss;
					context[top].s = s + 1;
					/* resumed with the wildcard pending */
					context[top].p = p;
					context[top].first = first;
					top++;
				}

				if (first) {
					/* remember first non-'*' char */
					ss = s;
					first = false;
				}

				matches = true;
			} else {
				matches = false;
			}

		} else if (s < es) {
			char ch = *p;

			if (ch == '#') {
				matches = true;
			} else if (case_sens) {
				matches = (*s == ch);
			} else {
				matches = (toupper((unsigned char)*s) ==
					   toupper((unsigned char)ch));
			}

			if (matches && first) {
				ss = s; /* remember first non-'*' char */
				first = false;
			}
		} else {
			matches = false;
		}

		if (matches) {
			p++;
			s++;
		} else {
			/* doesn't match,
			 * resume with stacked context if we have one */
			if (--top < 0) {
				return NULL; /* no match, give up */
			}

			ss = context[top].ss;
			s = context[top].s;
			p = context[top].p;
			first = context[top].first;
			wild = true;
		}
	}

	/* end of pattern reached; report a length of at least one */
	*m_len = (s - ss > 1) ? (unsigned int)(s - ss) : 1;

	return ss;
}
2012-08-14 03:23:03 -07:00
/* Exported function documented in content/textsearch.h */
nserror
content_textsearch_add_match(struct textsearch_context *context,
unsigned start_idx,
unsigned end_idx,
struct box *start_box,
struct box *end_box)
2012-08-14 03:23:03 -07:00
{
struct list_entry *entry;
/* found string in box => add to list */
entry = calloc(1, sizeof(*entry));
if (entry == NULL) {
return NSERROR_NOMEM;
2012-08-14 03:23:03 -07:00
}
entry->start_idx = start_idx;
entry->end_idx = end_idx;
entry->start_box = start_box;
entry->end_box = end_box;
2012-08-14 03:23:03 -07:00
entry->sel = NULL;
entry->next = NULL;
2012-08-14 03:23:03 -07:00
entry->prev = context->found->prev;
2013-04-30 08:15:49 -07:00
2019-11-10 12:32:37 -08:00
if (context->found->prev == NULL) {
2012-08-14 03:23:03 -07:00
context->found->next = entry;
2019-11-10 12:32:37 -08:00
} else {
2012-08-14 03:23:03 -07:00
context->found->prev->next = entry;
2019-11-10 12:32:37 -08:00
}
2013-04-30 08:15:49 -07:00
2012-08-14 03:23:03 -07:00
context->found->prev = entry;
return NSERROR_OK;
}
2012-08-14 03:23:03 -07:00
/**
 * Choose whether every match or only the current match is highlighted.
 *
 * Matches that should not be highlighted have their selection cleared and
 * destroyed; matches that should be highlighted and have no selection yet
 * get one created through the content handler.
 *
 * \param all     true to highlight all matches, false for the current one only
 * \param context The search context holding the matches.
 */
static void search_show_all(bool all, struct textsearch_context *context)
{
	struct list_entry *match;

	for (match = context->found->next; match != NULL; match = match->next) {
		bool wanted = all || (match == context->current);

		if (!wanted) {
			/* drop any highlight this match still carries */
			if (match->sel != NULL) {
				selection_clear(match->sel, true);
				selection_destroy(match->sel);
				match->sel = NULL;
			}
			continue;
		}

		if (match->sel != NULL) {
			/* already highlighted */
			continue;
		}

		if (context->c->handler->create_selection(context->c,
				&match->sel) == NSERROR_OK) {
			selection_set_start(match->sel, match->start_idx);
			selection_set_end(match->sel, match->end_idx);
		}
	}
}
2012-08-14 03:23:03 -07:00
/**
 * Search for a string in the content attached to a search context
 *
 * A fresh search is run when the context is new or the case sensitivity
 * changed; otherwise the current match is moved one step in the requested
 * direction. The GUI is then told about the result and, if there is a
 * current match, the content is asked to scroll to it.
 *
 * \param string the string to search for
 * \param string_len length of search string
 * \param context The search context to add the entry to.
 * \param flags flags to control the search.
 * \return NSERROR_OK on success (also when nothing matched or the context
 *         has no content), else the error code returned by the content's
 *         find or bounds handler.
 */
static nserror
search_text(const char *string,
		int string_len,
		struct textsearch_context *context,
		search_flags_t flags)
{
	struct rect bounds;
	union content_msg_data msg_data;
	bool case_sensitive = (flags & SEARCH_FLAG_CASE_SENSITIVE) != 0;
	bool forwards = (flags & SEARCH_FLAG_FORWARDS) != 0;
	bool showall = (flags & SEARCH_FLAG_SHOWALL) != 0;
	nserror res = NSERROR_OK;

	if (context->c == NULL) {
		return res;
	}

	/* check if we need to start a new search or continue an old one */
	if ((context->newsearch) ||
	    (context->prev_case_sens != case_sensitive)) {

		/* drop the old string first and do not leave it dangling
		 * while free_matches() may re-enter through the toolkit */
		free(context->string);
		context->string = NULL;

		context->current = NULL;
		free_matches(context);

		/* best effort copy: the search itself does not need it */
		context->string = malloc(string_len + 1);
		if (context->string != NULL) {
			memcpy(context->string, string, string_len);
			context->string[string_len] = '\0';
		}

		guit->search->hourglass(true, context->gui_p);

		/* call content find handler */
		res = context->c->handler->textsearch_find(context->c,
				context,
				string,
				string_len,
				case_sensitive);

		guit->search->hourglass(false, context->gui_p);

		if (res != NSERROR_OK) {
			free_matches(context);
			return res;
		}

		context->prev_case_sens = case_sensitive;

		/* new search, beginning at the top of the page */
		context->current = context->found->next;
		context->newsearch = false;

	} else if (context->current != NULL) {
		/* continued search in the direction specified */
		if (forwards) {
			if (context->current->next) {
				context->current = context->current->next;
			}
		} else {
			if (context->current->prev) {
				context->current = context->current->prev;
			}
		}
	}

	guit->search->status((context->current != NULL), context->gui_p);

	search_show_all(showall, context);

	guit->search->back_state((context->current != NULL) &&
			(context->current->prev != NULL),
			context->gui_p);
	guit->search->forward_state((context->current != NULL) &&
			(context->current->next != NULL),
			context->gui_p);

	if (context->current == NULL) {
		return res;
	}

	/* call content match bounds handler */
	res = context->c->handler->textsearch_bounds(context->c,
			context->current->start_idx,
			context->current->end_idx,
			context->current->start_box,
			context->current->end_box,
			&bounds);
	if (res == NSERROR_OK) {
		/* ask the content's users to scroll the match into view */
		msg_data.scroll.area = true;
		msg_data.scroll.x0 = bounds.x0;
		msg_data.scroll.y0 = bounds.y0;
		msg_data.scroll.x1 = bounds.x1;
		msg_data.scroll.y1 = bounds.y1;
		content_broadcast(context->c, CONTENT_MSG_SCROLL, &msg_data);
	}

	return res;
}
/**
 * Begins/continues the search process
 *
 * \note that this may be called many times for a single search.
 *
 * A string made up only of the wildcards '#' and '*' (or an empty string)
 * is not searched for: the matches are discarded and the content is asked
 * to scroll back to the origin instead.
 *
 * \param textsearch The search context in use.
 * \param flags The flags forward/back etc
 * \param string The string to match
 * \return NSERROR_OK on success else the error code from the search.
 */
static nserror
content_textsearch_step(struct textsearch_context *textsearch,
		search_flags_t flags,
		const char *string)
{
	int string_len;
	int i;
	nserror res = NSERROR_OK;

	assert(textsearch != NULL);

	guit->search->add_recent(string, textsearch->gui_p);

	/* find the first character that is not a wildcard */
	string_len = strlen(string);
	for (i = 0; i < string_len; i++) {
		if (string[i] != '#' && string[i] != '*') {
			break;
		}
	}

	if (i < string_len) {
		res = search_text(string, string_len, textsearch, flags);
	} else {
		union content_msg_data msg_data;

		/* the current match is about to be freed with the others,
		 * so do not keep a pointer to it */
		textsearch->current = NULL;
		free_matches(textsearch);

		guit->search->status(true, textsearch->gui_p);
		guit->search->back_state(false, textsearch->gui_p);
		guit->search->forward_state(false, textsearch->gui_p);

		msg_data.scroll.area = false;
		msg_data.scroll.x0 = 0;
		msg_data.scroll.y0 = 0;
		content_broadcast(textsearch->c, CONTENT_MSG_SCROLL, &msg_data);
	}

	return res;
}
/* Exported function documented in content/textsearch.h */
bool
content_textsearch_ishighlighted(struct textsearch_context *textsearch,
		unsigned start_offset,
		unsigned end_offset,
		unsigned *start_idx,
		unsigned *end_idx)
{
	struct list_entry *entry = textsearch->found->next;

	/* the first match whose selection covers the range decides */
	while (entry != NULL) {
		struct selection *sel = entry->sel;

		if (sel != NULL &&
		    selection_defined(sel) &&
		    selection_highlighted(sel,
				start_offset,
				end_offset,
				start_idx,
				end_idx)) {
			return true;
		}

		entry = entry->next;
	}

	return false;
}
2012-08-14 03:23:03 -07:00
/**
 * create a search_context
 *
 * The new context owns a freshly allocated, empty sentinel head for its
 * list of matches.
 *
 * \param c The content the search_context is connected to
 * \param gui_data A context pointer passed to the provider routines.
 * \param textsearch_out A pointer to receive the new text search context
 * \return NSERROR_OK on success and \a textsearch_out updated,
 *         NSERROR_NOT_IMPLEMENTED if the content handler lacks any of the
 *         find, bounds or selection operations,
 *         NSERROR_NOMEM on memory exhaustion.
 */
static nserror
content_textsearch_create(struct content *c,
		void *gui_data,
		struct textsearch_context **textsearch_out)
{
	struct textsearch_context *context;
	struct list_entry *search_head;

	if ((c->handler->textsearch_find == NULL) ||
	    (c->handler->textsearch_bounds == NULL) ||
	    (c->handler->create_selection == NULL)) {
		/*
		 * content has no free text find handler so searching
		 * is unsupported.
		 */
		return NSERROR_NOT_IMPLEMENTED;
	}

	context = malloc(sizeof(*context));
	if (context == NULL) {
		return NSERROR_NOMEM;
	}

	search_head = malloc(sizeof(*search_head));
	if (search_head == NULL) {
		free(context);
		return NSERROR_NOMEM;
	}

	/* empty sentinel: no matches yet */
	search_head->start_idx = 0;
	search_head->end_idx = 0;
	search_head->start_box = NULL;
	search_head->end_box = NULL;
	search_head->sel = NULL;
	search_head->prev = NULL;
	search_head->next = NULL;

	context->found = search_head;
	context->current = NULL;
	context->string = NULL;
	context->prev_case_sens = false;
	context->newsearch = true;
	context->c = c;
	context->gui_p = gui_data;

	*textsearch_out = context;

	return NSERROR_OK;
}
/* Exported function documented in search.h */
nserror content_textsearch_destroy(struct textsearch_context *textsearch)
{
	assert(textsearch != NULL);

	if (textsearch->string != NULL) {
		guit->search->add_recent(textsearch->string, textsearch->gui_p);
		free(textsearch->string);
		textsearch->string = NULL;
	}

	guit->search->forward_state(true, textsearch->gui_p);
	guit->search->back_state(true, textsearch->gui_p);

	/* release the matches, then the sentinel head they hang off;
	 * free_matches() leaves the head allocated, so it must be freed
	 * here or it is leaked with every destroyed context */
	free_matches(textsearch);
	free(textsearch->found);
	textsearch->found = NULL;

	free(textsearch);

	return NSERROR_OK;
}
/**
 * Terminate a search.
 *
 * Releases the search string remembered on the content and destroys the
 * search context attached to it, if there is one.
 *
 * \param c content to clear
 * \return NSERROR_OK always
 */
static nserror content_textsearch__clear(struct content *c)
{
	free(c->textsearch.string);
	c->textsearch.string = NULL;

	if (c->textsearch.context == NULL) {
		/* no search in progress */
		return NSERROR_OK;
	}

	content_textsearch_destroy(c->textsearch.context);
	c->textsearch.context = NULL;

	return NSERROR_OK;
}
/* exported interface, documented in content/textsearch.h */
/*
 * Three cases are handled:
 *  - string is NULL: any search on the content is cleared.
 *  - string equals the string of the search in progress: that search is
 *    continued.
 *  - otherwise: the previous search (if any) is destroyed and a new one
 *    is started.
 *
 * Errors from creating the context or from running the search step are
 * returned to the caller.
 */
nserror
content_textsearch(struct hlcache_handle *h,
		void *context,
		search_flags_t flags,
		const char *string)
{
	struct content *c = hlcache_handle_get_content(h);
	char *string_copy;
	nserror res;

	assert(c != NULL);

	if (string == NULL) {
		/* Clear search */
		return content_textsearch__clear(c);
	}

	if (c->textsearch.string != NULL &&
	    c->textsearch.context != NULL &&
	    strcmp(string, c->textsearch.string) == 0) {
		/* Continue prev. search */
		return content_textsearch_step(c->textsearch.context,
				flags,
				string);
	}

	/* New search */

	/* duplicate before freeing the old string: the caller may have
	 * passed the stored string itself, and on allocation failure the
	 * previous search state is left untouched */
	string_copy = strdup(string);
	if (string_copy == NULL) {
		return NSERROR_NOMEM;
	}
	free(c->textsearch.string);
	c->textsearch.string = string_copy;

	if (c->textsearch.context != NULL) {
		content_textsearch_destroy(c->textsearch.context);
		c->textsearch.context = NULL;
	}

	res = content_textsearch_create(c,
			context,
			&c->textsearch.context);
	if (res != NSERROR_OK) {
		return res;
	}

	/* search with the stored copy, which stays valid for the call */
	return content_textsearch_step(c->textsearch.context,
			flags,
			c->textsearch.string);
}
/* exported interface, documented in content/textsearch.h */
nserror content_textsearch_clear(struct hlcache_handle *h)
{
	struct content *content = hlcache_handle_get_content(h);

	assert(content != NULL);

	/* the content-level helper does the actual work */
	return content_textsearch__clear(content);
}