procps/proc/escape.c

217 lines
5.7 KiB
C
Raw Normal View History

2002-02-02 06:47:29 +08:00
/*
* Copyright 1998-2002 by Albert Cahalan; all rights reserved.
2002-02-02 06:47:29 +08:00
* This file may be used subject to the terms and conditions of the
* GNU Library General Public License Version 2, or any later version
* at your option, as published by the Free Software Foundation.
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Library General Public License for more details.
*/
2004-11-05 04:50:59 +08:00
#include <stdio.h>
2002-02-02 06:47:29 +08:00
#include <sys/types.h>
2002-12-21 18:34:50 +08:00
#include <string.h>
#include "procps.h"
#include "escape.h"
#include "readproc.h"
2002-02-02 06:47:29 +08:00
2004-11-05 04:50:59 +08:00
#if (__GNU_LIBRARY__ >= 6)
# include <wchar.h>
# include <wctype.h>
# include <stdlib.h> /* MB_CUR_MAX */
# include <ctype.h>
# include <langinfo.h>
#endif
2002-12-21 18:34:50 +08:00
2004-11-05 04:50:59 +08:00
#if (__GNU_LIBRARY__ >= 6)
static int escape_str_utf8(char *restrict dst, const char *restrict src, int bufsize, int *maxcells){
int my_cells = 0;
int my_bytes = 0;
mbstate_t s;
memset(&s, 0, sizeof (s));
for(;;) {
wchar_t wc;
int len = 0;
if(my_cells >= *maxcells || my_bytes+1 >= bufsize)
2002-02-02 06:47:29 +08:00
break;
2004-11-05 04:50:59 +08:00
if (!(len = mbrtowc (&wc, src, MB_CUR_MAX, &s)))
/* 'str' contains \0 */
2002-02-02 06:47:29 +08:00
break;
2004-11-05 04:50:59 +08:00
if (len < 0) {
/* invalid multibyte sequence -- zeroize state */
memset (&s, 0, sizeof (s));
*(dst++) = '?';
src++;
my_cells++;
my_bytes++;
} else if (len==1) {
/* non-multibyte */
*(dst++) = isprint(*src) ? *src : '?';
src++;
my_cells++;
my_bytes++;
} else if (!iswprint(wc)) {
/* multibyte - no printable */
*(dst++) = '?';
src+=len;
my_cells++;
my_bytes++;
} else {
/* multibyte - printable */
int wlen = wcwidth(wc);
if (wlen==0) {
// invisible multibyte -- we don't ignore it, because some terminal
// interpret it wrong and more safe is replace it with '?'
*(dst++) = '?';
src+=len;
my_cells++;
my_bytes++;
} else {
// multibyte - printable
// Got space?
if (my_cells+wlen > *maxcells || my_bytes+1+len >= bufsize) break;
// 0x9b is control byte for some terminals
if (memchr(src, 0x9B, len)) {
// unsafe multibyte
*(dst++) = '?';
src+=len;
my_cells++;
my_bytes++;
} else {
// safe multibyte
memcpy(dst, src, len);
my_cells += wlen;
dst += len;
my_bytes += len;
src += len;
}
}
2002-02-02 06:47:29 +08:00
}
2004-11-05 04:50:59 +08:00
//fprintf(stdout, "cells: %d\n", my_cells);
2002-02-02 06:47:29 +08:00
}
*(dst++) = '\0';
2004-11-05 04:50:59 +08:00
// fprintf(stderr, "maxcells: %d, my_cells; %d\n", *maxcells, my_cells);
*maxcells -= my_cells;
return my_bytes; // bytes of text, excluding the NUL
2002-02-02 06:47:29 +08:00
}
2004-11-05 04:50:59 +08:00
#endif /* __GNU_LIBRARY__ */
2002-02-02 06:47:29 +08:00
/* sanitize a string via one-way mangle */
2004-11-05 04:50:59 +08:00
int escape_str(char *restrict dst, const char *restrict src, int bufsize, int *maxcells){
2002-02-02 06:47:29 +08:00
unsigned char c;
2004-11-05 04:50:59 +08:00
int my_cells = 0;
2002-12-21 21:07:53 +08:00
int my_bytes = 0;
2002-11-27 08:24:01 +08:00
const char codes[] =
2002-02-02 06:47:29 +08:00
"Z-------------------------------"
"********************************"
"********************************"
"*******************************-"
"--------------------------------"
"********************************"
"********************************"
"********************************";
2004-11-05 04:50:59 +08:00
#if (__GNU_LIBRARY__ >= 6)
static int utf_init=0;
if(utf_init==0){
/* first call -- check if UTF stuff is usable */
char *enc = nl_langinfo(CODESET);
utf_init = enc && strcasecmp(enc, "UTF-8")==0 ? 1 : -1;
}
if (utf_init==1)
/* UTF8 locales */
return escape_str_utf8(dst, src, bufsize, maxcells);
#endif
if(bufsize > *maxcells+1) bufsize=*maxcells+1; // FIXME: assumes 8-bit locale
2002-12-21 21:07:53 +08:00
for(;;){
2004-11-05 04:50:59 +08:00
if(my_cells >= *maxcells || my_bytes+1 >= bufsize)
break;
2002-02-02 06:47:29 +08:00
c = (unsigned char) *(src++);
2002-12-21 21:07:53 +08:00
if(!c) break;
if(codes[c]=='-') c='?';
2004-11-05 04:50:59 +08:00
my_cells++;
2002-12-21 21:07:53 +08:00
my_bytes++;
*(dst++) = c;
2002-02-02 06:47:29 +08:00
}
*(dst++) = '\0';
2004-11-05 04:50:59 +08:00
*maxcells -= my_cells;
2002-12-21 21:07:53 +08:00
return my_bytes; // bytes of text, excluding the NUL
2002-02-02 06:47:29 +08:00
}
2002-12-21 18:34:50 +08:00
/////////////////////////////////////////////////
2002-02-02 06:47:29 +08:00
2002-12-21 18:34:50 +08:00
// escape an argv or environment string array
//
// bytes arg means sizeof(buf)
int escape_strlist(char *restrict dst, const char *restrict const *restrict src, size_t bytes, int *cells){
2002-02-02 06:47:29 +08:00
size_t i = 0;
2002-12-21 18:34:50 +08:00
for(;;){
2004-11-05 04:50:59 +08:00
i += escape_str(dst+i, *src, bytes-i, cells);
2002-12-21 18:34:50 +08:00
if(bytes-i < 3) break; // need room for space, a character, and the NUL
2002-02-02 06:47:29 +08:00
src++;
2002-12-21 18:34:50 +08:00
if(!*src) break; // need something to print
2004-11-05 04:50:59 +08:00
if (*cells<=1) break; // need room for printed size of text
2002-12-21 18:34:50 +08:00
dst[i++] = ' ';
2004-11-05 04:50:59 +08:00
--*cells;
2002-02-02 06:47:29 +08:00
}
2004-11-05 04:50:59 +08:00
return i; // bytes, excluding the NUL
2002-12-21 18:34:50 +08:00
}
///////////////////////////////////////////////////
2004-11-05 04:50:59 +08:00
int escape_command(char *restrict const outbuf, const proc_t *restrict const pp, int bytes, int *cells, unsigned flags){
2004-07-15 09:17:15 +08:00
int overhead = 0;
2002-12-21 18:34:50 +08:00
int end = 0;
if(flags & ESC_ARGS){
const char **lc = (const char**)pp->cmdline;
2004-11-05 04:50:59 +08:00
if(lc && *lc) return escape_strlist(outbuf, lc, bytes, cells);
2002-12-21 18:34:50 +08:00
}
if(flags & ESC_BRACKETS){
overhead += 2;
}
if(flags & ESC_DEFUNCT){
if(pp->state=='Z') overhead += 10; // chars in " <defunct>"
else flags &= ~ESC_DEFUNCT;
}
2004-11-05 04:50:59 +08:00
if(overhead + 1 >= *cells){ // if no room for even one byte of the command name
2002-12-21 18:34:50 +08:00
// you'd damn well better have _some_ space
2004-11-05 04:50:59 +08:00
// outbuf[0] = '-'; // Oct23
2002-12-21 18:34:50 +08:00
outbuf[1] = '\0';
return 1;
}
if(flags & ESC_BRACKETS){
outbuf[end++] = '[';
}
2004-11-05 04:50:59 +08:00
*cells -= overhead;
end += escape_str(outbuf+end, pp->cmd, bytes-overhead, cells);
2002-12-21 18:34:50 +08:00
// Hmmm, do we want "[foo] <defunct>" or "[foo <defunct>]"?
if(flags & ESC_BRACKETS){
outbuf[end++] = ']';
}
if(flags & ESC_DEFUNCT){
memcpy(outbuf+end, " <defunct>", 10);
end += 10;
}
outbuf[end] = '\0';
2004-11-05 04:50:59 +08:00
return end; // bytes, not including the NUL
2002-02-02 06:47:29 +08:00
}