Context Navigation

source: lib/misc.c @ 4c03881

Last change on this file since 4c03881 was 0f64ca7, checked in by Wilmer van der Gaast <wilmer@…>, at 2010-04-25T12:56:20Z
Make http_encode() RFC3986-compliant. (Escape everything except alphanumeric characters plus [-_~.].)
Property mode set to `100644`
File size: 14.0 KB

Line
1	/********************************************************************\
2	* BitlBee -- An IRC to other IM-networks gateway *
3	* *
4	* Copyright 2002-2006 Wilmer van der Gaast and others *
5	\********************************************************************/
6
7	/*
8	* Various utility functions. Some are copied from Gaim to support the
9	* IM-modules, most are from BitlBee.
10	*
11	* Copyright (C) 1998-1999, Mark Spencer <markster@marko.net>
12	* (and possibly other members of the Gaim team)
13	* Copyright 2002-2006 Wilmer van der Gaast <wilmer@gaast.net>
14	*/
15
16	/*
17	This program is free software; you can redistribute it and/or modify
18	it under the terms of the GNU General Public License as published by
19	the Free Software Foundation; either version 2 of the License, or
20	(at your option) any later version.
21
22	This program is distributed in the hope that it will be useful,
23	but WITHOUT ANY WARRANTY; without even the implied warranty of
24	MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
25	GNU General Public License for more details.
26
27	You should have received a copy of the GNU General Public License with
28	the Debian GNU/Linux distribution in /usr/share/common-licenses/GPL;
29	if not, write to the Free Software Foundation, Inc., 59 Temple Place,
30	Suite 330, Boston, MA 02111-1307 USA
31	*/
32
33	#define BITLBEE_CORE
34	#include "nogaim.h"
35	#include "base64.h"
36	#include "md5.h"
37	#include <stdio.h>
38	#include <stdlib.h>
39	#include <string.h>
40	#include <ctype.h>
41	#include <glib.h>
42	#include <time.h>
43
44	#ifdef HAVE_RESOLV_A
45	#include <arpa/nameser.h>
46	#include <resolv.h>
47	#endif
48
49	#include "md5.h"
50	#include "ssl_client.h"
51
52	void strip_linefeed(gchar *text)
53	{
54	int i, j;
55	gchar *text2 = g_malloc(strlen(text) + 1);
56
57	for (i = 0, j = 0; text[i]; i++)
58	if (text[i] != '\r')
59	text2[j++] = text[i];
60	text2[j] = '\0';
61
62	strcpy(text, text2);
63	g_free(text2);
64	}
65
66	time_t get_time(int year, int month, int day, int hour, int min, int sec)
67	{
68	struct tm tm;
69
70	memset(&tm, 0, sizeof(struct tm));
71	tm.tm_year = year - 1900;
72	tm.tm_mon = month - 1;
73	tm.tm_mday = day;
74	tm.tm_hour = hour;
75	tm.tm_min = min;
76	tm.tm_sec = sec >= 0 ? sec : time(NULL) % 60;
77
78	return mktime(&tm);
79	}
80
81	time_t mktime_utc( struct tm *tp )
82	{
83	struct tm utc;
84	time_t res, tres;
85
86	tp->tm_isdst = -1;
87	res = mktime( tp );
88	/* Problem is, mktime() just gave us the GMT timestamp for the
89	given local time... While the given time WAS NOT local. So
90	we should fix this now.
91
92	Now I could choose between messing with environment variables
93	(kludgy) or using timegm() (not portable)... Or doing the
94	following, which I actually prefer...
95
96	tzset() may also work but in other places I actually want to
97	use local time.
98
99	FFFFFFFFFFFFFFFFFFFFFUUUUUUUUUUUUUUUUUUUU!! */
100	gmtime_r( &res, &utc );
101	utc.tm_isdst = -1;
102	if( utc.tm_hour == tp->tm_hour && utc.tm_min == tp->tm_min )
103	/* Sweet! We're in UTC right now... */
104	return res;
105
106	tres = mktime( &utc );
107	res += res - tres;
108
109	/* Yes, this is a hack. And it will go wrong around DST changes.
110	BUT this is more likely to be threadsafe than messing with
111	environment variables, and possibly more portable... */
112
113	return res;
114	}
115
116	typedef struct htmlentity
117	{
118	char code[7];
119	char is[3];
120	} htmlentity_t;
121
122	static const htmlentity_t ent[] =
123	{
124	{ "lt", "<" },
125	{ "gt", ">" },
126	{ "amp", "&" },
127	{ "apos", "'" },
128	{ "quot", "\"" },
129	{ "aacute", "á" },
130	{ "eacute", "é" },
131	{ "iacute", "é" },
132	{ "oacute", "ó" },
133	{ "uacute", "ú" },
134	{ "agrave", "à" },
135	{ "egrave", "è" },
136	{ "igrave", "ì" },
137	{ "ograve", "ò" },
138	{ "ugrave", "ù" },
139	{ "acirc", "â" },
140	{ "ecirc", "ê" },
141	{ "icirc", "î" },
142	{ "ocirc", "ô" },
143	{ "ucirc", "û" },
144	{ "auml", "ä" },
145	{ "euml", "ë" },
146	{ "iuml", "ï" },
147	{ "ouml", "ö" },
148	{ "uuml", "ü" },
149	{ "nbsp", " " },
150	{ "", "" }
151	};
152
153	void strip_html( char *in )
154	{
155	char *start = in;
156	char *out = g_malloc( strlen( in ) + 1 );
157	char s = out, cs;
158	int i, matched;
159
160	memset( out, 0, strlen( in ) + 1 );
161
162	while( *in )
163	{
164	if( in == '<' && ( isalpha( (in+1) ) \|\| *(in+1) == '/' ) )
165	{
166	/* If in points at a < and in+1 points at a letter or a slash, this is probably
167	a HTML-tag. Try to find a closing > and continue there. If the > can't be
168	found, assume that it wasn't a HTML-tag after all. */
169
170	cs = in;
171
172	while( in && in != '>' )
173	in ++;
174
175	if( *in )
176	{
177	if( g_strncasecmp( cs+1, "br", 2) == 0 )
178	*(s++) = '\n';
179	in ++;
180	}
181	else
182	{
183	in = cs;
184	(s++) = (in++);
185	}
186	}
187	else if( *in == '&' )
188	{
189	cs = ++in;
190	while( in && isalpha( in ) )
191	in ++;
192
193	if( *in == ';' ) in ++;
194	matched = 0;
195
196	for( i = 0; *ent[i].code; i ++ )
197	if( g_strncasecmp( ent[i].code, cs, strlen( ent[i].code ) ) == 0 )
198	{
199	int j;
200
201	for( j = 0; ent[i].is[j]; j ++ )
202	*(s++) = ent[i].is[j];
203
204	matched = 1;
205	break;
206	}
207
208	/* None of the entities were matched, so return the string */
209	if( !matched )
210	{
211	in = cs - 1;
212	(s++) = (in++);
213	}
214	}
215	else
216	{
217	(s++) = (in++);
218	}
219	}
220
221	strcpy( start, out );
222	g_free( out );
223	}
224
225	char escape_html( const char html )
226	{
227	const char *c = html;
228	GString *ret;
229	char *str;
230
231	if( html == NULL )
232	return( NULL );
233
234	ret = g_string_new( "" );
235
236	while( *c )
237	{
238	switch( *c )
239	{
240	case '&':
241	ret = g_string_append( ret, "&" );
242	break;
243	case '<':
244	ret = g_string_append( ret, "<" );
245	break;
246	case '>':
247	ret = g_string_append( ret, ">" );
248	break;
249	case '"':
250	ret = g_string_append( ret, """ );
251	break;
252	default:
253	ret = g_string_append_c( ret, *c );
254	}
255	c ++;
256	}
257
258	str = ret->str;
259	g_string_free( ret, FALSE );
260	return( str );
261	}
262
263	/* Decode%20a%20file%20name */
264	void http_decode( char *s )
265	{
266	char *t;
267	int i, j, k;
268
269	t = g_new( char, strlen( s ) + 1 );
270
271	for( i = j = 0; s[i]; i ++, j ++ )
272	{
273	if( s[i] == '%' )
274	{
275	if( sscanf( s + i + 1, "%2x", &k ) )
276	{
277	t[j] = k;
278	i += 2;
279	}
280	else
281	{
282	*t = 0;
283	break;
284	}
285	}
286	else
287	{
288	t[j] = s[i];
289	}
290	}
291	t[j] = 0;
292
293	strcpy( s, t );
294	g_free( t );
295	}
296
297	/* Warning: This one explodes the string. Worst-cases can make the string 3x its original size! */
298	/* This fuction is safe, but make sure you call it safely as well! */
299	void http_encode( char *s )
300	{
301	char *t;
302	int i, j;
303
304	t = g_strdup( s );
305
306	for( i = j = 0; t[i]; i ++, j ++ )
307	{
308	if( !isalnum( t[i] ) && !strchr( "._-~", t[i] ) )
309	{
310	sprintf( s + j, "%%%02X", ((unsigned char*)t)[i] );
311	j += 2;
312	}
313	else
314	{
315	s[j] = t[i];
316	}
317	}
318	s[j] = 0;
319
320	g_free( t );
321	}
322
323	/* Strip newlines from a string. Modifies the string passed to it. */
324	char strip_newlines( char source )
325	{
326	int i;
327
328	for( i = 0; source[i] != '\0'; i ++ )
329	if( source[i] == '\n' \|\| source[i] == '\r' )
330	source[i] = ' ';
331
332	return source;
333	}
334
335	/* Wrap an IPv4 address into IPv6 space. Not thread-safe... */
336	char ipv6_wrap( char src )
337	{
338	static char dst[64];
339	int i;
340
341	for( i = 0; src[i]; i ++ )
342	if( ( src[i] < '0' \|\| src[i] > '9' ) && src[i] != '.' )
343	break;
344
345	/* Hmm, it's not even an IP... */
346	if( src[i] )
347	return src;
348
349	g_snprintf( dst, sizeof( dst ), "::ffff:%s", src );
350
351	return dst;
352	}
353
354	/* Unwrap an IPv4 address into IPv6 space. Thread-safe, because it's very simple. :-) */
355	char ipv6_unwrap( char src )
356	{
357	int i;
358
359	if( g_strncasecmp( src, "::ffff:", 7 ) != 0 )
360	return src;
361
362	for( i = 7; src[i]; i ++ )
363	if( ( src[i] < '0' \|\| src[i] > '9' ) && src[i] != '.' )
364	break;
365
366	/* Hmm, it's not even an IP... */
367	if( src[i] )
368	return src;
369
370	return ( src + 7 );
371	}
372
373	/* Convert from one charset to another.
374
375	from_cs, to_cs: Source and destination charsets
376	src, dst: Source and destination strings
377	size: Size if src. 0 == use strlen(). strlen() is not reliable for UNICODE/UTF16 strings though.
378	maxbuf: Maximum number of bytes to write to dst
379
380	Returns the number of bytes written to maxbuf or -1 on an error.
381	*/
382	signed int do_iconv( char from_cs, char to_cs, char src, char dst, size_t size, size_t maxbuf )
383	{
384	GIConv cd;
385	size_t res;
386	size_t inbytesleft, outbytesleft;
387	char *inbuf = src;
388	char *outbuf = dst;
389
390	cd = g_iconv_open( to_cs, from_cs );
391	if( cd == (GIConv) -1 )
392	return( -1 );
393
394	inbytesleft = size ? size : strlen( src );
395	outbytesleft = maxbuf - 1;
396	res = g_iconv( cd, &inbuf, &inbytesleft, &outbuf, &outbytesleft );
397	*outbuf = '\0';
398	g_iconv_close( cd );
399
400	if( res == (size_t) -1 )
401	return( -1 );
402	else
403	return( outbuf - dst );
404	}
405
406	/* A pretty reliable random number generator. Tries to use the /dev/random
407	devices first, and falls back to the random number generator from libc
408	when it fails. Opens randomizer devices with O_NONBLOCK to make sure a
409	lack of entropy won't halt BitlBee. */
410	void random_bytes( unsigned char *buf, int count )
411	{
412	#ifndef _WIN32
413	static int use_dev = -1;
414
415	/* Actually this probing code isn't really necessary, is it? */
416	if( use_dev == -1 )
417	{
418	if( access( "/dev/random", R_OK ) == 0 \|\| access( "/dev/urandom", R_OK ) == 0 )
419	use_dev = 1;
420	else
421	{
422	use_dev = 0;
423	srand( ( getpid() << 16 ) ^ time( NULL ) );
424	}
425	}
426
427	if( use_dev )
428	{
429	int fd;
430
431	/* At least on Linux, /dev/random can block if there's not
432	enough entropy. We really don't want that, so if it can't
433	give anything, use /dev/urandom instead. */
434	if( ( fd = open( "/dev/random", O_RDONLY \| O_NONBLOCK ) ) >= 0 )
435	if( read( fd, buf, count ) == count )
436	{
437	close( fd );
438	return;
439	}
440	close( fd );
441
442	/* urandom isn't supposed to block at all, but just to be
443	sure. If it blocks, we'll disable use_dev and use the libc
444	randomizer instead. */
445	if( ( fd = open( "/dev/urandom", O_RDONLY \| O_NONBLOCK ) ) >= 0 )
446	if( read( fd, buf, count ) == count )
447	{
448	close( fd );
449	return;
450	}
451	close( fd );
452
453	/* If /dev/random blocks once, we'll still try to use it
454	again next time. If /dev/urandom also fails for some
455	reason, stick with libc during this session. */
456
457	use_dev = 0;
458	srand( ( getpid() << 16 ) ^ time( NULL ) );
459	}
460
461	if( !use_dev )
462	#endif
463	{
464	int i;
465
466	/* Possibly the LSB of rand() isn't very random on some
467	platforms. Seems okay on at least Linux and OSX though. */
468	for( i = 0; i < count; i ++ )
469	buf[i] = rand() & 0xff;
470	}
471	}
472
473	int is_bool( char *value )
474	{
475	if( *value == 0 )
476	return 0;
477
478	if( ( g_strcasecmp( value, "true" ) == 0 ) \|\| ( g_strcasecmp( value, "yes" ) == 0 ) \|\| ( g_strcasecmp( value, "on" ) == 0 ) )
479	return 1;
480	if( ( g_strcasecmp( value, "false" ) == 0 ) \|\| ( g_strcasecmp( value, "no" ) == 0 ) \|\| ( g_strcasecmp( value, "off" ) == 0 ) )
481	return 1;
482
483	while( *value )
484	if( !isdigit( *value ) )
485	return 0;
486	else
487	value ++;
488
489	return 1;
490	}
491
492	int bool2int( char *value )
493	{
494	int i;
495
496	if( ( g_strcasecmp( value, "true" ) == 0 ) \|\| ( g_strcasecmp( value, "yes" ) == 0 ) \|\| ( g_strcasecmp( value, "on" ) == 0 ) )
497	return 1;
498	if( ( g_strcasecmp( value, "false" ) == 0 ) \|\| ( g_strcasecmp( value, "no" ) == 0 ) \|\| ( g_strcasecmp( value, "off" ) == 0 ) )
499	return 0;
500
501	if( sscanf( value, "%d", &i ) == 1 )
502	return i;
503
504	return 0;
505	}
506
507	struct ns_srv_reply srv_lookup( char service, char protocol, char domain )
508	{
509	struct ns_srv_reply *reply = NULL;
510	#ifdef HAVE_RESOLV_A
511	char name[1024];
512	unsigned char querybuf[1024];
513	const unsigned char *buf;
514	ns_msg nsh;
515	ns_rr rr;
516	int i, len, size;
517
518	g_snprintf( name, sizeof( name ), "_%s._%s.%s", service, protocol, domain );
519
520	if( ( size = res_query( name, ns_c_in, ns_t_srv, querybuf, sizeof( querybuf ) ) ) <= 0 )
521	return NULL;
522
523	if( ns_initparse( querybuf, size, &nsh ) != 0 )
524	return NULL;
525
526	if( ns_parserr( &nsh, ns_s_an, 0, &rr ) != 0 )
527	return NULL;
528
529	size = ns_rr_rdlen( rr );
530	buf = ns_rr_rdata( rr );
531
532	len = 0;
533	for( i = 6; i < size && buf[i]; i += buf[i] + 1 )
534	len += buf[i] + 1;
535
536	if( i > size )
537	return NULL;
538
539	reply = g_malloc( sizeof( struct ns_srv_reply ) + len );
540	memcpy( reply->name, buf + 7, len );
541
542	for( i = buf[6]; i < len && buf[7+i]; i += buf[7+i] + 1 )
543	reply->name[i] = '.';
544
545	if( i > len )
546	{
547	g_free( reply );
548	return NULL;
549	}
550
551	reply->prio = ( buf[0] << 8 ) \| buf[1];
552	reply->weight = ( buf[2] << 8 ) \| buf[3];
553	reply->port = ( buf[4] << 8 ) \| buf[5];
554	#endif
555
556	return reply;
557	}
558
559	/* Word wrapping. Yes, I know this isn't UTF-8 clean. I'm willing to take the risk. */
560	char word_wrap( const char msg, int line_len )
561	{
562	GString *ret = g_string_sized_new( strlen( msg ) + 16 );
563
564	while( strlen( msg ) > line_len )
565	{
566	int i;
567
568	/* First try to find out if there's a newline already. Don't
569	want to add more splits than necessary. */
570	for( i = line_len; i > 0 && msg[i] != '\n'; i -- );
571	if( msg[i] == '\n' )
572	{
573	g_string_append_len( ret, msg, i + 1 );
574	msg += i + 1;
575	continue;
576	}
577
578	for( i = line_len; i > 0; i -- )
579	{
580	if( msg[i] == '-' )
581	{
582	g_string_append_len( ret, msg, i + 1 );
583	g_string_append_c( ret, '\n' );
584	msg += i + 1;
585	break;
586	}
587	else if( msg[i] == ' ' )
588	{
589	g_string_append_len( ret, msg, i );
590	g_string_append_c( ret, '\n' );
591	msg += i + 1;
592	break;
593	}
594	}
595	if( i == 0 )
596	{
597	g_string_append_len( ret, msg, line_len );
598	g_string_append_c( ret, '\n' );
599	msg += line_len;
600	}
601	}
602	g_string_append( ret, msg );
603
604	return g_string_free( ret, FALSE );
605	}
606
607	gboolean ssl_sockerr_again( void *ssl )
608	{
609	if( ssl )
610	return ssl_errno == SSL_AGAIN;
611	else
612	return sockerr_again();
613	}
614
615	/* Returns values: -1 == Failure (base64-decoded to something unexpected)
616	0 == Okay
617	1 == Password doesn't match the hash. */
618	int md5_verify_password( char password, char hash )
619	{
620	md5_byte_t *pass_dec = NULL;
621	md5_byte_t pass_md5[16];
622	md5_state_t md5_state;
623	int ret = -1, i;
624
625	if( base64_decode( hash, &pass_dec ) == 21 )
626	{
627	md5_init( &md5_state );
628	md5_append( &md5_state, (md5_byte_t*) password, strlen( password ) );
629	md5_append( &md5_state, (md5_byte_t) pass_dec + 16, 5 ); / Hmmm, salt! */
630	md5_finish( &md5_state, pass_md5 );
631
632	for( i = 0; i < 16; i ++ )
633	{
634	if( pass_dec[i] != pass_md5[i] )
635	{
636	ret = 1;
637	break;
638	}
639	}
640
641	/* If we reached the end of the loop, it was a match! */
642	if( i == 16 )
643	ret = 0;
644	}
645
646	g_free( pass_dec );
647
648	return ret;
649	}

Note: See TracBrowser for help on using the repository browser.

Download in other formats: