#include "..\..\inc\swilib.h"
#include "base64.h"
#include "sf_mime.h"
#include "decode.h"
#include "leak_debug.h"

/*
 * NOTE(review): the initializer of `br` contains a raw line break between the
 * quotes. It looks damaged and is kept exactly as found -- confirm the
 * intended value against version control.
 */
char *br = "
", *zerostr = "";

extern int strncmp_nocase(const char *s1,const char *s2,unsigned int n);

/*
 * Returns 1 when c is the ASCII space character and 0 otherwise.
 *
 * Only ' ' is recognised (no tab / CR / LF).  The earlier version returned
 * the opposite (0 for a space, 1 for anything else), which contradicted the
 * function name and the "ignore spaces between encoded words" test in
 * unmime_header(), and it used NULL where an int was required.
 */
#pragma inline
int is_space(int c)
{
  return (c == ' ') ? 1 : 0;
}

/*
 * ASCII-only upper-casing: 'a'..'z' map to 'A'..'Z', every other value is
 * returned unchanged.
 */
#pragma inline
int toupper(int c)
{
  if (c >= 'a' && c <= 'z')
    return c - ('a' - 'A');
  return c;
}

/*
 * NOTE(review): the next line is damaged -- the body of the MIN macro and the
 * head of base64_decode() are missing.  It is reproduced verbatim; restore it
 * from version control.
 */
#define MIN(A,B) A=len) { doit=0; break; } unsigned int ch; ch = _sf_uc_bi[*(unsigned char *)str]; if(ch < B64_UNUSED) { pr[n] = ch; n++; str++; } else if(ch == B64_UNUSED) { str++; } else { doit = 0; break; } } if(doit == 0 && n < 4) { pr[n+2] = pr[n+1] = pr[n]='\0'; } *(ou+0) = (pr[0] << 2) | (pr[1] >> 4); *(ou+1) = (pr[1] << 4) | (pr[2] >> 2); *(ou+2) = (pr[2] << 6) | (pr[3] >> 0); ou = ou+((n * 3) >> 2); } while(doit); _sf_b64_len = (ou - output); if(size) *size = _sf_b64_len; *ou = '\0'; /* NUL-terminate */ return (debug_realloc(output,_sf_b64_len+1, "base64_decode (realloc)")); }

/*
 * Converts one hexadecimal digit character to its value.
 * Returns 0..15 for '0'-'9', 'A'-'F', 'a'-'f' and -1 for anything else.
 */
#pragma inline
int char_to_hex(int c)
{
  if (c >= '0' && c <= '9')
    return c - '0';
  if (c >= 'A' && c <= 'F')
    return c - 'A' + 10;
  if (c >= 'a' && c <= 'f')
    return c - 'a' + 10;
  return -1;
}

/*
 * NOTE(review): quoted_printable_decode() is damaged further down (its loop
 * is cut off); the visible head is reproduced verbatim.
 */
char * quoted_printable_decode(const char *str, size_t *size) { char *buf; char *s, *d; register int n; register int len; int c; if(!str) return 0; /* * Allocate sufficient space to hold decoded string. */ d=(char *)str; len=size?*size:strlen(str); s=buf=debug_malloc(len + 1, "quoted_printable_decode (1)"); if(!buf) /* ENOMEM? 
*/ return 0; for(; *str && (str - d) 0) memcpy(d+d_ptr, prev_br, len); d_ptr += strlen(s) - (prev_br - s); d[d_ptr] = 0; return(d); } void strip_special(char *s) { int n = strlen(s); //сюда мы будем бросать кости char *d = (char*) debug_malloc(n+1, "strip_special (1)"); char *buf = d; for(int i = 0; i < n; i++) { if(s[i] == '&' && s[i+1] == '#') { int c = 0; for(i+=2; s[i] != ';'; i++) { c*=10; c+= s[i] - '0'; } *d++ = unicode2win(c); } else { *d++ = s[i]; } } *d = 0; strcpy(s,buf); debug_mfree(buf, "strip_special (1)"); } void strip_html(char *s) { int d_ptr = 0; char *script, *script_end, *s1, *s2; const char *valid = "abcdefghijklmnopqrstuvwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789$-_.+!*'(),%;:@&=/?абвгдеёжзийклмнопрстуфхцчшщъыьэюяАБВГДЕЁЖЗИЙКЛМНОПРСТУФХЦЧШЩЪЫЬЭЮЯ~#"; s1 = strreplace(s, "\r\n\r\n", br); s2 = s1; s1 = strreplace(s2, "
", br); debug_mfree(s2, "strip_html (11)"); s2 = s1; s1 = strreplace(s2, "", zerostr); debug_mfree(s2, "strip_html (12)"); s2 = s1; s1 = strreplace(s2, "\r\r", br); debug_mfree(s2, "strip_html (13)"); s2 = s1; s1 = strreplace(s2, "\n\n", br); debug_mfree(s2, "strip_html (14)"); s2 = s1; s1 = strreplace(s2, "\n", "
"); debug_mfree(s2, "strip_html (15)"); s2 = s1; s1 = strreplace(s2, "\r", "
"); debug_mfree(s2, "strip_html (16)"); s2 = s1; s1 = strreplace(s2, "

", br); debug_mfree(s2, "strip_html (17)"); s2 = s1; s1 = strreplace(s2, "

", br); debug_mfree(s2, "strip_html (1)"); s2 = s1; s1 = strreplace(s2, "\r", "
"); debug_mfree(s2, "strip_html (18)"); s2 = s1; s1 = strreplace(s2, "\n", "
"); debug_mfree(s2, "strip_html (19)"); s2 = s1; s1 = strreplace(s2, "

", br); debug_mfree(s2, "strip_html (20)"); s2 = s1; //Заменим ссылки char *a = strstr(s1, "")+1; //ищем конец открывающего тега ea = strstr(he, ""); //и начало закрывающего rpl = strstr(he, " rpl) { a = rpl; continue; } if(ss && ea) //если не нашли - косяк { st1 = (char*)debug_malloc(he-hrf-5, "strip_html (a1)"); //выделяем память под промежуточные строки st2 = (char*)debug_malloc(ea-ss+1, "strip_html (a2)"); rpl = (char*)debug_malloc(ea-a+5, "strip_html (a3)"); memcpy(st1, hrf+6, he-hrf-6); st1[he-hrf-6] = 0; //копируем их туда memcpy(st2, ss, ea-ss); st2[ea-ss] = 0; memcpy(rpl, a, ea-a+4); rpl[ea-a+4] = 0; //что будем заменять ss = (char*)debug_malloc(strlen(st1) + strlen(st2) + 6, "strip_html (a4)"); memset(ss, 0, strlen(st1) + strlen(st2) + 6); if(strcmp(st1, st2)) snprintf(ss, strlen(st1) + strlen(st2) + 5, " %s {%s} ", st2, st1); // на что заменяем else snprintf(ss, strlen(st1) + strlen(st2) + 5, " {%s} ", st2, st1); // на что заменяем n = a-s1; //Найдём смещение, откуда плясать дальше s2 = strreplace(s1, rpl, ss); //Собственно замена debug_mfree(s1, "strip_html (a4)"); s1 = s2; //явки-пароли поменялись a = s1 + n; //дальше искать отсюда debug_mfree(ss, "strip_html (a4)"); //всем спасибо, все свободны debug_mfree(rpl, "strip_html (a3)"); debug_mfree(st2, "strip_html (a2)"); debug_mfree(st1, "strip_html (a1)"); } } if(ss) a = ss; a = strstr(a+1, ""); if(!script_end) break; script_end += strlen(""); strcpy(script, script_end); } while(script = strstr_nocase(s1, ""); if(!script_end) break; script_end += strlen(""); strcpy(script, script_end); } s2 = s1; s1 = strreplace(s2, br, "\r\n"); debug_mfree(s2, "strip_html (21)"); s2 = s1; s1 = strreplace(s2, "

", "\r\n"); debug_mfree(s2, "strip_html (23)"); s2 = s1; s1 = strreplace(s2, "", "/blockquote>\r\n"); debug_mfree(s2, "strip_html (25)"); s2 = s1; s1 = strreplace(s2, "", " "); debug_mfree(s2, "strip_html (26)"); s2 = s1; s1 = strreplace(s2, "", "\r\n"); debug_mfree(s2, "strip_html (27)"); s2 = s1; s1 = strreplace(s2, ""e;", "\""); debug_mfree(s2, "strip_html (28)"); s2 = s1; s1 = strreplace(s2, " ", " "); debug_mfree(s2, "strip_html (29)"); s2 = s1; s1 = strreplace(s2, "<", "<"); debug_mfree(s2, "strip_html (30)"); s2 = s1; s1 = strreplace(s2, ">", ">"); debug_mfree(s2, "strip_html (31)"); s2 = s1; s1 = strreplace(s2, "&", "&"); debug_mfree(s2, "strip_html (32)"); s2 = s1; s1 = strreplace(s2, "©", "(c)"); debug_mfree(s2, "strip_html (33)"); //сюда мы будем бросать кости char *d = (char*) debug_malloc(strlen(s)+1, "strip_html (1)"); //отфильтруем html - результат заведомо меньшей длины char *r = s1; d_ptr = 0; while(*r) { for(;*r && *r != '<'; r++) d[d_ptr++] = *r; for(;*r && *r != '>'; r++); if(*r) r++; } d[d_ptr] = 0; //вернём модифицированную строку в исходный буфер strcpy(s,d); debug_mfree(d, "strip_html (2)"); debug_mfree(s1, "strip_html (3)"); strip_special(s); } int get_charset(char *charset) { if (!strncmp_nocase(charset,"windows-1251",12)) return WIN_1251; if (!strncmp_nocase(charset,"koi8-r",6)) return KOI8_R; if (!strncmp_nocase(charset,"ISO-8859-5",10)) return ISO_8859_5; if (!strncmp_nocase(charset,"UTF-8",5)) return UTF_8; return WIN_1251; } char *unmime_header(const char *encoded_str, int default_charset) { const char *p = encoded_str; const char *eword_begin_p, *encoding_begin_p, *text_begin_p, *eword_end_p; char charset[32]; int encoding; char *conv_str; char *outbuf; char *out_str; size_t out_len; size_t decoded_len; out_len=strlen(encoded_str) * 2; outbuf = (char*) debug_malloc(out_len, "unmime_header (1)"); zeromem(outbuf,out_len); while (*p != '\0') { char *decoded_text = NULL; int len; eword_begin_p = strstr(p, ENCODED_WORD_BEGIN); if 
(!eword_begin_p) { char * curbuf = (char*) debug_malloc(strlen(p)+1, "unmime_header (2)"); switch(default_charset) { default: case WIN_1251: strcpy(curbuf,p); break; case KOI8_R: koi2win(curbuf,p); break; case ISO_8859_5: iso885952win(curbuf,p); break; case UTF_8: utf82win(curbuf,p); break; } strcat(outbuf, curbuf); debug_mfree(curbuf, "unmime_header (1)"); //strcat(outbuf, p); break; } encoding_begin_p = strchr(eword_begin_p + 2, '?'); if (!encoding_begin_p) { strcat(outbuf, p); break; } text_begin_p = strchr(encoding_begin_p + 1, '?'); if (!text_begin_p) { strcat(outbuf, p); break; } eword_end_p = strstr(text_begin_p + 1, ENCODED_WORD_END); if (!eword_end_p) { strcat(outbuf, p); break; } if (p == encoded_str) { strncat(outbuf, p, eword_begin_p - p); p = eword_begin_p; } else { /* ignore spaces between encoded words */ const char *sp; for (sp = p; sp < eword_begin_p; sp++) { if (!is_space(*sp)) { strncat(outbuf, p, eword_begin_p - p); p = eword_begin_p; break; } } } len = MIN(sizeof(charset) - 1, encoding_begin_p - (eword_begin_p + 2)); strncpy(charset, eword_begin_p + 2, len); charset[len] = '\0'; encoding = toupper(*(encoding_begin_p + 1)); if (encoding == 'B') { decoded_len=eword_end_p - (text_begin_p + 1); decoded_text = base64_decode(text_begin_p + 1,&decoded_len); } else if (encoding == 'Q') { decoded_len=eword_end_p - (text_begin_p + 1); decoded_text = quoted_printable_decode(text_begin_p + 1,&decoded_len); } else { strncat(outbuf, p, eword_end_p + 2 - p); p = eword_end_p + 2; continue; } switch(get_charset(charset)) { case WIN_1251: conv_str=(char*) debug_malloc(strlen(decoded_text)+1, "unmime_header (6)"); strcpy(conv_str,decoded_text); break; case KOI8_R: conv_str=(char*) debug_malloc(strlen(decoded_text)+1, "unmime_header (3)"); koi2win(conv_str,decoded_text); break; case ISO_8859_5: conv_str=(char*) debug_malloc(strlen(decoded_text)+1, "unmime_header (4)"); iso885952win(conv_str,decoded_text); break; case UTF_8: conv_str=(char*) 
debug_malloc(strlen(decoded_text)+1, "unmime_header (5)"); utf82win(conv_str,decoded_text); break; } strcat(outbuf, conv_str); debug_mfree(conv_str, "unmime_header (2)"); debug_mfree(decoded_text, "unmime_header (3)"); p = eword_end_p + 2; } out_str = outbuf; out_len = strlen(outbuf); return debug_realloc(out_str, out_len + 1, "unmime_header (1)"); }