/android/import-contacts

To get this branch, use:
bzr branch http://bzr.ed.am/android/import-contacts

« back to all changes in this revision

Viewing changes to src/org/waxworlds/edam/importcontacts/VCFImporter.java

  • Committer: edam
  • Date: 2010-10-17 18:43:13 UTC
  • Revision ID: edam@waxworlds.org-20101017184313-y2m6gsdzctjq5wtl
- changed case on charset and encoding warning strings (it looked bad)
- properly handle quoted-printable unencoding (including multi-line values)
- ignore blank lines in vCard
- ignore empty properties in vCard

Show diffs side-by-side

added added

removed removed

67
67
                        // open directory
68
68
                        String location = prefs.getString( "location", "" );
69
69
                        File dir = new File( location );
70
 
                        if( !dir.exists() || !dir.isDirectory() )
 
70
                        if( !dir.exists() )
71
71
                                showError( R.string.error_locationnotfound );
72
72
 
73
 
                        // get files
74
 
                        class VCardFilter implements FilenameFilter {
75
 
                                public boolean accept( File dir, String name ) {
76
 
                                        return name.toLowerCase().endsWith( ".vcf" );
 
73
                        // directory, or file?
 
74
                        if( dir.isDirectory() )
 
75
                        {
 
76
                                // get files
 
77
                                class VCardFilter implements FilenameFilter {
 
78
                                        public boolean accept( File dir, String name ) {
 
79
                                                return name.toLowerCase().endsWith( ".vcf" );
 
80
                                        }
77
81
                                }
78
 
                        }
79
 
                        files = dir.listFiles( new VCardFilter() );
 
82
                                files = dir.listFiles( new VCardFilter() );
 
83
                        }
 
84
                        else
 
85
                        {
 
86
                                // use just this file
 
87
                                files = new File[ 1 ];
 
88
                                files[ 0 ] = dir;
 
89
                        }
80
90
                }
81
91
                catch( SecurityException e ) {
82
92
                        showError( R.string.error_locationpermissions );
128
138
 
129
139
                }
130
140
                catch( FileNotFoundException e ) {
131
 
                        showError( getText( R.string.error_filenotfound ) + file.getName() );
 
141
                        showError( getText( R.string.error_filenotfound ) +
 
142
                                file.getName() );
132
143
                }
133
144
                catch( IOException e ) {
134
145
                        showError( getText( R.string.error_ioerror ) + file.getName() );
152
163
                        importVCardFileContent( content.toString(), file.getName() );
153
164
                }
154
165
                catch( FileNotFoundException e ) {
155
 
                        showError( getText( R.string.error_filenotfound ) + file.getName() );
 
166
                        showError( getText( R.string.error_filenotfound ) +
 
167
                                file.getName() );
156
168
                }
157
169
                catch( IOException e ) {
158
170
                        showError( getText( R.string.error_ioerror ) + file.getName() );
162
174
        private void importVCardFileContent( String content, String fileName )
163
175
                        throws AbortImportException
164
176
        {
165
 
                // unfold RFC2425 section 5.8.1 folded lines, except that we must also
166
 
                // handle embedded Quoted-Printable encodings that have a trailing '='.
167
 
                // So we remove these first before doing RFC2425 unfolding.
168
 
                content = content.replaceAll( "=\n[ \\t]", "" )
169
 
                                .replaceAll( "\n[ \\t]", "" );
170
 
 
171
177
                // get lines and parse them
172
178
                String[] lines = content.split( "\n" );
173
179
                VCard vCard = null;
242
248
 
243
249
                private String _version = null;
244
250
                private Vector< String > _lines = null;
245
 
                private int _nameLevel = NAMELEVEL_NONE;
 
251
                private int _name_level = NAMELEVEL_NONE;
 
252
                private boolean _parser_in_multiline = false;
 
253
                private String _parser_current_name_and_params = null;
 
254
                private String _parser_buffered_value_so_far = "";
 
255
 
 
256
                protected class UnencodeResult
 
257
                {
 
258
                        private boolean _another_line_required;
 
259
                        private byte[] _bytes;
 
260
                        private int _num_bytes;
 
261
 
 
262
                        public UnencodeResult( boolean another_line_required, byte[] bytes,
 
263
                                int num_bytes )
 
264
                        {
 
265
                                _another_line_required = another_line_required;
 
266
                                _bytes = bytes;
 
267
                                _num_bytes = num_bytes;
 
268
                        }
 
269
 
 
270
                        public boolean isAnotherLineRequired()
 
271
                        {
 
272
                                return _another_line_required;
 
273
                        }
 
274
 
 
275
                        public byte[] getBytes()
 
276
                        {
 
277
                                return _bytes;
 
278
                        }
 
279
 
 
280
                        public int getNumBytes()
 
281
                        {
 
282
                                return _num_bytes;
 
283
                        }
 
284
                }
246
285
 
247
286
                @SuppressWarnings("serial")
248
287
                protected class ParseException extends Exception
266
305
                                throws ParseException, SkipContactException,
267
306
                                AbortImportException
268
307
                {
269
 
                        // get property halves
270
 
                        String[] props = line.split( ":" );
 
308
                        // ignore empty lines
 
309
                        if( line.trim() == "" ) return;
 
310
 
 
311
                        // split line into name and value parts (this may turn out to be
 
312
                        // unwanted if the line is a subsequent line in a multi-line
 
313
                        // value, but we have to do this now to check for and handle VCF
 
314
                        // versions first)
 
315
                        String[] props = line.split(  ":", 2 );
271
316
                        for( int i = 0; i < props.length; i++ )
272
317
                                props[ i ] = props[ i ].trim();
273
 
                        if( props.length < 2 ||
274
 
                                        props[ 0 ].length() < 1 || props[ 1 ].length() < 1 )
275
 
                                throw new ParseException( R.string.error_vcf_malformed );
276
318
 
 
319
                        // if we haven't yet got a version, we won't be parsing anything!
277
320
                        if( _version == null )
278
321
                        {
279
 
                                if( props[ 0 ].equals( "VERSION" ) )
 
322
                                // is this a version?
 
323
                                if( props.length == 2 && props[ 0 ].equals( "VERSION" ) )
280
324
                                {
281
 
                                        // get version
 
325
                                        // yes, check/store it
282
326
                                        if( !props[ 1 ].equals( "2.1" ) &&
283
327
                                                        !props[ 1 ].equals( "3.0" ) )
284
328
                                                throw new ParseException( R.string.error_vcf_version );
292
336
                                }
293
337
                                else
294
338
                                {
295
 
                                        // stash this line till we have a version
 
339
                                        // no, so stash this line till we have a version
296
340
                                        if( _lines == null )
297
341
                                                _lines = new Vector< String >();
298
342
                                        _lines.add( line );
300
344
                        }
301
345
                        else
302
346
                        {
 
347
                                if( _parser_in_multiline )
 
348
                                {
 
349
                                        // if we're currently in a multi-line value, use the stored
 
350
                                        // property name and parameters
 
351
                                        props = new String[ 2 ];
 
352
                                        props[ 0 ] = _parser_current_name_and_params;
 
353
                                        props[ 1 ] = line.trim();
 
354
                                }
 
355
                                else
 
356
                                {
 
357
                                        // for normal lines, check the property name/value bits
 
358
                                        if( props.length < 2 || props[ 0 ].length() == 0 )
 
359
                                                throw new ParseException(
 
360
                                                        R.string.error_vcf_malformed );
 
361
 
 
362
                                        // ignore empty properties
 
363
                                        if( props[ 1 ].length() < 1 )
 
364
                                                return;
 
365
 
 
366
                                        // reset the saved multi-line state
 
367
                                        _parser_current_name_and_params = props[ 0 ];
 
368
                                        _parser_buffered_value_so_far = "";
 
369
                                }
 
370
 
303
371
                                // get parameter parts
304
372
                                String[] params = props[ 0 ].split( ";" );
305
373
                                for( int i = 0; i < params.length; i++ )
306
374
                                        params[ i ] = params[ i ].trim();
307
375
 
 
376
                                // parse charset and encoding parameters
 
377
                                String charset, encoding;
 
378
                                if( ( charset = checkParam( params, "CHARSET" ) ) != null &&
 
379
                                        !charset.equals( "UTF-8" ) && !charset.equals( "UTF-16" ) )
 
380
                                {
 
381
                                        throw new ParseException( R.string.error_vcf_charset );
 
382
                                }
 
383
                                if( ( encoding = checkParam( params, "ENCODING" ) ) != null &&
 
384
                                        !encoding.equals( "QUOTED-PRINTABLE" ) &&
 
385
                                        !encoding.equals( "8BIT" ) )
 
386
                                        //&& !encoding.equals( "BASE64" ) )
 
387
                                {
 
388
                                        throw new ParseException( R.string.error_vcf_encoding );
 
389
                                }
 
390
 
 
391
                                // do unencoding (or default to a fake unencoding result with
 
392
                                // the raw string)
 
393
                                UnencodeResult result;
 
394
                                if( encoding != null && encoding.equals( "QUOTED-PRINTABLE" ) )
 
395
                                        result = unencodeQuotedPrintable( props[ 1 ], charset );
 
396
//                              else if( encoding != null && encoding.equals( "BASE64" ) )
 
397
//                                      result = unencodeBase64( props[ 1 ], charset );
 
398
                                else
 
399
                                        result = new UnencodeResult( false, props[ 1 ].getBytes(),
 
400
                                                props[ 1 ].getBytes().length );
 
401
 
 
402
                                // process charset
 
403
                                try {
 
404
                                        props[ 1 ] = new String( result.getBytes(), 0,
 
405
                                                result.getNumBytes(),
 
406
                                                charset == null? "UTF-8" : charset );
 
407
                                } catch( UnsupportedEncodingException e ) {
 
408
                                        throw new ParseException( R.string.error_vcf_charset );
 
409
                                }
 
410
 
 
411
                                // handle multi-line requests
 
412
                                _parser_in_multiline = result.isAnotherLineRequired();
 
413
                                if( _parser_in_multiline ) {
 
414
                                        _parser_buffered_value_so_far += props[ 1 ];
 
415
                                        return;
 
416
                                }
 
417
 
 
418
                                // add on buffered multi-line content
 
419
                                String value = _parser_buffered_value_so_far + props[ 1 ];
 
420
 
308
421
                                // parse some properties
309
422
                                if( params[ 0 ].equals( "N" ) )
310
 
                                        parseN( params, props[ 1 ] );
 
423
                                        parseN( params, value );
311
424
                                else if( params[ 0 ].equals( "FN" ) )
312
 
                                        parseFN( params, props[ 1 ] );
 
425
                                        parseFN( params, value );
313
426
                                else if( params[ 0 ].equals( "ORG" ) )
314
 
                                        parseORG( params, props[ 1 ] );
 
427
                                        parseORG( params, value );
315
428
                                else if( params[ 0 ].equals( "TEL" ) )
316
 
                                        parseTEL( params, props[ 1 ] );
 
429
                                        parseTEL( params, value );
317
430
                                else if( params[ 0 ].equals( "EMAIL" ) )
318
 
                                        parseEMAIL( params, props[ 1 ] );
 
431
                                        parseEMAIL( params, value );
319
432
                        }
320
433
                }
321
434
 
324
437
                                AbortImportException
325
438
                {
326
439
                        // already got a better name?
327
 
                        if( _nameLevel >= NAMELEVEL_N ) return;
 
440
                        if( _name_level >= NAMELEVEL_N ) return;
328
441
 
329
442
                        // get name parts
330
443
                        String[] nameparts = value.split( ";" );
339
452
                                value += ( value.length() == 0? "" : " " ) + nameparts[ 0 ];
340
453
 
341
454
                        // set name
342
 
                        setName( undoCharsetAndEncoding( params, value ) );
343
 
                        _nameLevel = NAMELEVEL_N;
 
455
                        setName( value );
 
456
                        _name_level = NAMELEVEL_N;
344
457
 
345
458
                        // check now to see if we need to import this contact (to avoid
346
459
                        // parsing the rest of the vCard unnecessarily)
352
465
                                throws ParseException, SkipContactException
353
466
                {
354
467
                        // already got a better name?
355
 
                        if( _nameLevel >= NAMELEVEL_FN ) return;
 
468
                        if( _name_level >= NAMELEVEL_FN ) return;
356
469
 
357
470
                        // set name
358
 
                        setName( undoCharsetAndEncoding( params, value ) );
359
 
                        _nameLevel = NAMELEVEL_FN;
 
471
                        setName( value );
 
472
                        _name_level = NAMELEVEL_FN;
360
473
                }
361
474
 
362
475
                private void parseORG( String[] params, String value )
363
476
                                throws ParseException, SkipContactException
364
477
                {
365
478
                        // already got a better name?
366
 
                        if( _nameLevel >= NAMELEVEL_ORG ) return;
 
479
                        if( _name_level >= NAMELEVEL_ORG ) return;
367
480
 
368
481
                        // get org parts
369
482
                        String[] orgparts = value.split( ";" );
377
490
                                value = orgparts[ 0 ];
378
491
 
379
492
                        // set name
380
 
                        setName( undoCharsetAndEncoding( params, value ) );
381
 
                        _nameLevel = NAMELEVEL_ORG;
 
493
                        setName( value );
 
494
                        _name_level = NAMELEVEL_ORG;
382
495
                }
383
496
 
384
497
                private void parseTEL( String[] params, String value )
409
522
                }
410
523
 
411
524
                public void parseEMAIL( String[] params, String value )
 
525
                                throws ParseException
412
526
                {
413
527
                        if( value.length() == 0 ) return;
414
528
 
432
546
                                throw new ParseException( R.string.error_vcf_malformed );
433
547
 
434
548
                        //  missing name properties?
435
 
                        if( _nameLevel == NAMELEVEL_NONE )
 
549
                        if( _name_level == NAMELEVEL_NONE )
436
550
                                throw new ParseException( R.string.error_vcf_noname );
437
551
 
438
552
                        // check if we should import this one? If we've already got an 'N'-
439
553
                        // type name, this will already have been done by parseN() so we
440
554
                        // mustn't do this here (or it could prompt twice!)
441
 
                        if( _nameLevel < NAMELEVEL_N && !isImportRequired( getName() ) )
 
555
                        if( _name_level < NAMELEVEL_N && !isImportRequired( getName() ) )
442
556
                                throw new SkipContactException();
443
557
                }
444
558
 
445
 
                private String undoCharsetAndEncoding( String[] params, String value )
446
 
                                throws ParseException
447
 
                {
448
 
                        // check encoding/charset
449
 
                        String charset, encoding;
450
 
                        if( ( charset = checkParam( params, "CHARSET" ) ) != null &&
451
 
                                        !charset.equals( "UTF-8" ) && !charset.equals( "UTF-16" ) )
452
 
                                throw new ParseException( R.string.error_vcf_charset );
453
 
                        if( ( encoding = checkParam( params, "ENCODING" ) ) != null &&
454
 
                                        !encoding.equals( "QUOTED-PRINTABLE" ) )
455
 
                                throw new ParseException( R.string.error_vcf_encoding );
456
 
 
457
 
                        // do decoding?
458
 
                        if( encoding != null && encoding.equals( "QUOTED-PRINTABLE" ) )
459
 
                                return unencodeQuotedPrintable( value, charset );
460
 
 
461
 
                        // nothing to do!
462
 
                        return value;
463
 
                }
464
 
 
465
559
                private String checkParam( String[] params, String name )
466
560
                {
467
561
                        Pattern p = Pattern.compile( "^" + name + "[ \\t]*=[ \\t]*(.*)$" );
497
591
                        return types;
498
592
                }
499
593
 
500
 
                private String unencodeQuotedPrintable( String str, String charset )
 
594
                private UnencodeResult unencodeQuotedPrintable( String str, String charset )
501
595
                {
 
596
                        boolean another = false;
 
597
 
502
598
                        // default encoding scheme
503
599
                        if( charset == null ) charset = "UTF-8";
504
600
 
505
601
                        // unencode quoted-printable encoding, as per RFC1521 section 5.1
506
602
                        byte[] bytes = new byte[ str.length() ];
507
603
                        int j = 0;
508
 
                        for( int i = 0; i < str.length(); i++, j++ ) {
 
604
                        for( int i = 0; i < str.length(); i++ )
 
605
                        {
 
606
                                // get next char and process...
509
607
                                char ch = str.charAt( i );
510
 
                                if( ch == '=' && i < str.length() - 2 ) {
 
608
                                if( ch == '=' && i < str.length() - 2 )
 
609
                                {
 
610
                                        // we found a =XX format byte, add it
511
611
                                        bytes[ j ] = (byte)(
512
612
                                                        Character.digit( str.charAt( i + 1 ), 16 ) * 16 +
513
613
                                                        Character.digit( str.charAt( i + 2 ), 16 ) );
514
614
                                        i += 2;
515
615
                                }
 
616
                                else if( ch == '=' && i == str.length() - 1 )
 
617
                                {
 
618
                                        // we found a '=' at the end of a line signifying a multi-
 
619
                                        // line string, so we don't add it.
 
620
                                        another = true;
 
621
                                        continue;
 
622
                                }
516
623
                                else
 
624
                                        // just a normal char...
517
625
                                        bytes[ j ] = (byte)ch;
 
626
                                j++;
518
627
                        }
519
 
                        try {
520
 
                                return new String( bytes, 0, j, charset );
521
 
                        } catch( UnsupportedEncodingException e ) { }
522
 
                        return null;
 
628
 
 
629
                        return new UnencodeResult( another, bytes, j );
523
630
                }
524
631
        }
525
632
}