summaryrefslogtreecommitdiff
path: root/src/detab.c
diff options
context:
space:
mode:
authorJohn MacFarlane <jgm@berkeley.edu>2014-09-17 14:05:04 -0700
committerJohn MacFarlane <jgm@berkeley.edu>2014-09-17 14:05:04 -0700
commit309173a493aea59cce5cce1b52b86e01b041bb8f (patch)
tree30eea56599b096d11cf4eaad38d395b3910a35b4 /src/detab.c
parent6326bc748c8f5f225d82c01fe6763776f2bbd88e (diff)
parent3aa56049d4b52b55a2313e51698090ee81e10036 (diff)
Merge pull request #66 from vmg/revamp
Enfastenate the C Parsenator
Diffstat (limited to 'src/detab.c')
-rw-r--r--src/detab.c48
1 files changed, 0 insertions, 48 deletions
diff --git a/src/detab.c b/src/detab.c
deleted file mode 100644
index e03fcf7..0000000
--- a/src/detab.c
+++ /dev/null
@@ -1,48 +0,0 @@
-#include "bstrlib.h"
-
-// UTF-8 aware detab: assumes s has no newlines, or only a final newline.
-// Return 0 on success, BSTR_ERR if invalid UTF-8.
-extern int bdetab(bstring s, int utf8)
-{
- unsigned char c;
- int pos = 0; // a count of characters
- int byte = 0; // a count of bytes
- int high_chars_to_skip = 0;
- int numspaces = 0;
- while ((c = bchar(s, byte))) {
- if (utf8 && high_chars_to_skip > 0) {
- if (c >= 0x80) {
- high_chars_to_skip--;
- byte++;
- } else {
- return BSTR_ERR; // invalid utf-8
- }
- } else if (c == '\t') {
- bdelete(s, byte, 1); // delete tab character
- numspaces = 4 - (pos % 4);
- binsertch(s, byte, numspaces, ' ');
- byte += numspaces;
- pos += numspaces;
- } else if (c <= 0x80 || !utf8) {
- byte++;
- pos++;
- } else { // multibyte utf8 sequences
- if (c >> 1 == 0176) {
- high_chars_to_skip = 5;
- } else if (c >> 2 == 076) {
- high_chars_to_skip = 4;
- } else if (c >> 3 == 036) {
- high_chars_to_skip = 3;
- } else if (c >> 4 == 016) {
- high_chars_to_skip = 2;
- } else if (c >> 5 == 06) {
- high_chars_to_skip = 1;
- } else {
- return BSTR_ERR; // invalid utf-8
- }
- pos++;
- byte++;
- }
- }
- return 0;
-}