#include <sys/types.h>
#include <sys/mman.h>
#include <sys/stat.h>
#include <err.h>
#include <errno.h>
#include <fcntl.h>
#include <getopt.h>
#include <limits.h>
#include <locale.h>
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
#include <wchar.h>
#include <wctype.h>
#include "pathnames.h"
/* Default file to search; main() starts with this and replaces it if a file operand is given. */
static char _path_words[] = _PATH_WORDS;
/*
 * Result codes returned by compare(): the key relative to the line it
 * was compared against.
 */
#define EQUAL 0
#define GREATER 1
#define LESS (-1)
/*
 * dflag: only alphanumeric characters take part in comparisons (-d).
 * fflag: characters are lower-cased before comparison (-f).
 * main() turns both on when no file operand is supplied.
 */
static int dflag, fflag;
/*
 * Search helpers.  All of them take the prepared wide-character key and
 * a [front, back) byte range of the mapped file.
 * NOTE(review): binary_search() and linear_search() are declared to
 * return char * although they return pointers into the unsigned char
 * range they are given.
 */
static char *binary_search(wchar_t *, unsigned char *, unsigned char *);
static int compare(wchar_t *, unsigned char *, unsigned char *);
static char *linear_search(wchar_t *, unsigned char *, unsigned char *);
static int look(wchar_t *, unsigned char *, unsigned char *);
/* Converts the command-line key to the wide-character form used by compare(). */
static wchar_t *prepkey(const char *, wchar_t);
static void print_from(wchar_t *, unsigned char *, unsigned char *);
/* Prints the usage message and exits; does not return. */
static void usage(void) __dead2;
/*
 * Long option names and the short option character each one is
 * reported as by getopt_long().
 *
 * "ignore-case" must map to 'f': that is the case-folding option letter
 * present in the option string and handled by main().  Mapping it to a
 * letter that is not handled would send the long option to the usage
 * error path.
 */
static struct option longopts[] = {
	{ "alternative",	no_argument,		NULL, 'a' },
	{ "alphanum",		no_argument,		NULL, 'd' },
	{ "ignore-case",	no_argument,		NULL, 'f' },
	{ "terminate",		required_argument,	NULL, 't' },
	{ NULL,			0,			NULL, 0 },
};
/*
 * look string [file ...]
 *
 * Prints every line of each file that begins with the given string.
 * Options: -d compares alphanumeric characters only, -f folds case,
 * -t char truncates the key after the first occurrence of char, -a is
 * accepted and ignored.  With no file operand the default word list is
 * searched and -d and -f are implied.
 *
 * Exit status: 0 if at least one file produced a match, 1 if none did,
 * 2 on error.
 */
int
main(int argc, char *argv[])
{
	struct stat sb;
	int ch, fd, match;
	wchar_t termchar;
	unsigned char *back, *front;
	const char *file;
	wchar_t *key;

	(void) setlocale(LC_CTYPE, "");

	file = _path_words;
	termchar = L'\0';
	while ((ch = getopt_long(argc, argv, "+adft:", longopts, NULL)) != -1)
		switch(ch) {
		case 'a':
			/* Accepted, but has no effect. */
			break;
		case 'd':
			dflag = 1;
			break;
		case 'f':
			fflag = 1;
			break;
		case 't':
			/* The argument must be exactly one (multibyte) character. */
			if (mbrtowc(&termchar, optarg, MB_LEN_MAX, NULL) !=
			    strlen(optarg))
				errx(2, "invalid termination character");
			break;
		case '?':
		default:
			usage();
		}
	argc -= optind;
	argv += optind;

	if (argc == 0)
		usage();
	if (argc == 1)			/* No file operand: use the defaults. */
		dflag = fflag = 1;
	key = prepkey(*argv++, termchar);
	if (argc >= 2)
		file = *argv++;

	/*
	 * look() returns 0 on a match and 1 otherwise, so the product stays 1
	 * only if no file matched.
	 */
	match = 1;

	do {
		if ((fd = open(file, O_RDONLY)) < 0 || fstat(fd, &sb))
			err(2, "%s", file);
		if ((uintmax_t)sb.st_size > (uintmax_t)SIZE_MAX)
			errx(2, "%s: %s", file, strerror(EFBIG));
		if (sb.st_size == 0) {
			/* Nothing to map or search; move on to the next file. */
			close(fd);
			continue;
		}
		front = mmap(NULL, (size_t)sb.st_size, PROT_READ, MAP_SHARED,
		    fd, (off_t)0);
		if (front == MAP_FAILED)
			err(2, "%s", file);
		back = front + sb.st_size;
		match *= (look(key, front, back));
		/* Release the mapping so it does not pile up across files. */
		(void)munmap(front, (size_t)sb.st_size);
		close(fd);
	} while (argc-- > 2 && (file = *argv++));

	exit(match);
}
/*
 * Build the wide-character search key from the multibyte argument.
 *
 * Each character is lower-cased when fflag is set and dropped when dflag
 * is set and it is not alphanumeric.  If termchar is non-null and occurs
 * in the resulting key, the key is cut off right after its first
 * occurrence.  An invalid or incomplete multibyte sequence is fatal.
 *
 * Returns a malloc'd, null-terminated wide string.
 */
static wchar_t *
prepkey(const char *string, wchar_t termchar)
{
	wchar_t *key, *out, *stop;
	wchar_t wc;
	size_t nbytes;

	key = malloc(sizeof(wchar_t) * (strlen(string) + 1));
	if (key == NULL)
		err(2, NULL);

	out = key;
	for (;;) {
		nbytes = mbrtowc(&wc, string, MB_LEN_MAX, NULL);
		if (nbytes == 0)	/* reached the terminating NUL */
			break;
		if (nbytes == (size_t)-1 || nbytes == (size_t)-2)
			errc(2, EILSEQ, NULL);
		if (fflag)
			wc = towlower(wc);
		if (!dflag || iswalnum(wc))
			*out++ = wc;
		string += nbytes;
	}
	*out = L'\0';

	if (termchar != L'\0') {
		stop = wcschr(key, termchar);
		if (stop != NULL)
			stop[1] = L'\0';	/* keep termchar, drop the rest */
	}
	return (key);
}
/*
 * Search [front, back) for lines starting with string and print them.
 *
 * A binary search narrows the range, a linear search then locates the
 * first matching line, and print_from() emits the matches.
 *
 * Returns 0 if a match was found and printed, 1 otherwise.
 */
static int
look(wchar_t *string, unsigned char *front, unsigned char *back)
{
	unsigned char *hit;

	hit = (unsigned char *)binary_search(string, front, back);
	hit = (unsigned char *)linear_search(string, hit, back);
	if (hit == NULL)
		return (1);

	print_from(string, hit, back);
	return (0);
}
/*
 * Advance p to the byte just after the next '\n' at or after p, or to
 * back if no newline is found first.
 *
 * p must be a modifiable pointer lvalue and is evaluated more than once.
 * The expansion is a single statement without a trailing semicolon, so
 * the macro can be used safely in an unbraced if/else.
 */
#define SKIP_PAST_NEWLINE(p, back)					\
	do {								\
		while ((p) < (back) && *(p)++ != '\n')			\
			continue;					\
	} while (0)
/*
 * Narrow [front, back) by bisection.
 *
 * Each step picks the midpoint, moves it forward to the start of the
 * following line, and compares the key with that line: if the key is
 * GREATER the lower bound moves up to that line, otherwise the upper
 * bound moves down to it.  The loop ends when the probe reaches the
 * upper bound or the range is empty.
 *
 * Returns the final lower bound; the caller continues from there with a
 * linear search.
 */
static char *
binary_search(wchar_t *string, unsigned char *front, unsigned char *back)
{
	unsigned char *probe;

	for (;;) {
		probe = front + (back - front) / 2;
		SKIP_PAST_NEWLINE(probe, back);
		if (probe >= back || back <= front)
			break;
		if (compare(string, probe, back) == GREATER)
			front = probe;
		else
			back = probe;
	}
	return ((char *)front);
}
/*
 * Walk the lines of [front, back) in order and return the start of the
 * first line for which compare() reports EQUAL.
 *
 * Returns NULL as soon as a line compares LESS (the key sorts before
 * it), or when the range is exhausted.
 */
static char *
linear_search(wchar_t *string, unsigned char *front, unsigned char *back)
{
	int rel;

	for (; front < back; ) {
		rel = compare(string, front, back);
		if (rel == EQUAL)
			return ((char *)front);
		if (rel == LESS)
			return (NULL);
		/* Key is still greater: try the next line. */
		SKIP_PAST_NEWLINE(front, back);
	}
	return (NULL);
}
/*
 * Print consecutive lines, starting at front, for as long as each line
 * compares EQUAL to string.  Every printed line is followed by a
 * newline, including a final line that has none in the file.
 *
 * A write failure on stdout is fatal (exit status 2).
 */
static void
print_from(wchar_t *string, unsigned char *front, unsigned char *back)
{
	while (front < back && compare(string, front, back) == EQUAL) {
		for (; front < back && *front != '\n'; ++front)
			if (putchar(*front) == EOF)
				err(2, "stdout");
		if (putchar('\n') == EOF)
			err(2, "stdout");
		/*
		 * Step over the newline.  If the line ran into the end of
		 * the range without one, front already equals back and must
		 * not be moved past it.
		 */
		if (front < back)
			++front;
	}
}
/*
 * Compare the key s1 with the line that starts at s2 and ends at the
 * next '\n' or at back, whichever comes first.
 *
 * The line is decoded one multibyte character at a time; a byte that
 * cannot be decoded is compared as a single character with that byte's
 * value.  With fflag set, line characters are lower-cased; with dflag
 * set, non-alphanumeric line characters are skipped.
 *
 * Returns:
 *	LESS/GREATER	at the first differing character, according to
 *			whether the key character is smaller or larger;
 *	GREATER		if the line ends before the key does;
 *	EQUAL		if the whole key was matched.
 */
static int
compare(wchar_t *s1, unsigned char *s2, unsigned char *back)
{
	mbstate_t mbs;
	wchar_t ch1, ch2;
	size_t len2;

	/*
	 * Use a private conversion state so that a failed or incomplete
	 * conversion cannot affect later calls.
	 */
	memset(&mbs, 0, sizeof(mbs));

	for (; *s1 && s2 < back && *s2 != '\n'; ++s1, s2 += len2) {
		ch1 = *s1;
		len2 = mbrtowc(&ch2, (const char *)s2, (size_t)(back - s2),
		    &mbs);
		if (len2 == (size_t)-1 || len2 == (size_t)-2) {
			/* Undecodable: treat the byte as a character. */
			ch2 = *s2;
			len2 = 1;
			memset(&mbs, 0, sizeof(mbs));
		} else if (len2 == 0) {
			/*
			 * mbrtowc() returns 0 for a NUL byte; it still
			 * occupies one byte, and advancing by 0 would loop
			 * forever when the character is skipped below.
			 */
			len2 = 1;
		}
		if (fflag)
			ch2 = towlower(ch2);
		if (dflag && !iswalnum(ch2)) {
			/* Skip this line character; stay on the same key character. */
			--s1;
			continue;
		}
		if (ch1 != ch2)
			return (ch1 < ch2 ? LESS : GREATER);
	}
	return (*s1 ? GREATER : EQUAL);
}
/*
 * Write the command synopsis to stderr and exit with status 2.
 */
static void
usage(void)
{
	static const char synopsis[] =
	    "usage: look [-df] [-t char] string [file ...]\n";

	(void)fprintf(stderr, "%s", synopsis);
	exit(2);
}