diff options
Diffstat (limited to 'src/region-cache.h')
-rw-r--r-- | src/region-cache.h | 111 |
1 files changed, 111 insertions, 0 deletions
diff --git a/src/region-cache.h b/src/region-cache.h new file mode 100644 index 00000000000..b9f20fc4f58 --- /dev/null +++ b/src/region-cache.h @@ -0,0 +1,111 @@ +/* Header file: Caching facts about regions of the buffer, for optimization. + Copyright (C) 1985, 1986, 1993 Free Software Foundation, Inc. + +This file is part of GNU Emacs. + +GNU Emacs is free software; you can redistribute it and/or modify +it under the terms of the GNU General Public License as published by +the Free Software Foundation; either version 2, or (at your option) +any later version. + +GNU Emacs is distributed in the hope that it will be useful, +but WITHOUT ANY WARRANTY; without even the implied warranty of +MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +GNU General Public License for more details. + +You should have received a copy of the GNU General Public License +along with GNU Emacs; see the file COPYING. If not, write to +the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA. */ + + +/* This code was written by Jim Blandy <jimb@cs.oberlin.edu> to help + GNU Emacs better support the gene editor written for the University + of Illinois at Urbana-Champagne's Ribosome Database Project (RDP). + + Emacs implements line operations (finding the beginning/end of the + line, vertical motion, all the redisplay stuff) by searching for + newlines in the buffer. Usually, this is a good design; it's very + clean to just represent the buffer as an unstructured string of + characters, and the lines in most files are very short (less than + eighty characters), meaning that scanning usually costs about the + same as the overhead of maintaining some more complicated data + structure. + + However, some applications, like gene editing, make use of very + long lines --- on the order of tens of kilobytes. In such cases, + it may well be worthwhile to try to avoid scanning, because the + scans have become two orders of magnitude more expensive. It would + be nice if this speedup could preserve the simplicity of the + existing data structure, and disturb as little of the existing code + as possible. + + So here's the tack. We add some caching to the scan_buffer + function, so that when it searches for a newline, it notes that the + region between the start and end of the search contained no + newlines; then, the next time around, it consults this cache to see + if there are regions of text it can skip over completely. The + buffer modification primitives invalidate this cache. + + (Note: Since the redisplay code needs similar information on + modified regions of the buffer, we can use the code that helps out + redisplay as a guide to where we need to add our own code to + invalidate our cache. prepare_to_modify_buffer seems to be the + central spot.) + + Note that the cache code itself never mentions newlines + specifically, so if you wanted to cache other properties of regions + of the buffer, you could use this code pretty much unchanged. So + this cache really holds "known/unknown" information --- "I know + this region has property P" vs. "I don't know if this region has + property P or not." */ + + +/* Allocate, initialize and return a new, empty region cache. */ +struct region_cache *new_region_cache ( /* void */ ); + +/* Free a region cache. */ +void free_region_cache ( /* struct region_cache * */ ); + +/* Assert that the region of BUF between START and END (absolute + buffer positions) is "known," for the purposes of CACHE (e.g. "has + no newlines", in the case of the line cache). */ +extern void know_region_cache ( /* struct buffer *BUF, + struct region_cache *CACHE, + int START, END */ ); + +/* Indicate that a section of BUF has changed, to invalidate CACHE. + HEAD is the number of chars unchanged at the beginning of the buffer. + TAIL is the number of chars unchanged at the end of the buffer. + NOTE: this is *not* the same as the ending position of modified + region. + (This way of specifying regions makes more sense than absolute + buffer positions in the presence of insertions and deletions; the + args to pass are the same before and after such an operation.) */ +extern void invalidate_region_cache ( /* struct buffer *BUF, + struct region_cache *CACHE, + int HEAD, TAIL */ ); + +/* The scanning functions. + + Basically, if you're scanning forward/backward from position POS, + and region_cache_forward/backward returns true, you can skip all + the text between POS and *NEXT. And if the function returns false, + you should examine all the text from POS to *NEXT, and call + know_region_cache depending on what you find there; this way, you + might be able to avoid scanning it again. */ + +/* Return true if the text immediately after POS in BUF is known, for + the purposes of CACHE. If NEXT is non-zero, set *NEXT to the nearest + position after POS where the knownness changes. */ +extern int region_cache_forward ( /* struct buffer *BUF, + struct region_cache *CACHE, + int POS, + int *NEXT */ ); + +/* Return true if the text immediately before POS in BUF is known, for + the purposes of CACHE. If NEXT is non-zero, set *NEXT to the nearest + position before POS where the knownness changes. */ +extern int region_cache_backward ( /* struct buffer *BUF, + struct region_cache *CACHE, + int POS, + int *NEXT */ ); |