/android/import-contacts

To get this branch, use:
bzr branch http://bzr.ed.am/android/import-contacts

« back to all changes in this revision

Viewing changes to src/am/ed/importcontacts/VcardImporter.java

  • Committer: edam
  • Date: 2012-12-21 14:47:57 UTC
  • Revision ID: tim@ed.am-20121221144757-5cb1lgsp7fdt7p2n
updated TODO

Show diffs side-by-side

added added

removed removed

1
1
/*
2
2
 * VcardImporter.java
3
3
 *
4
 
 * Copyright (C) 2009 to 2013 Tim Marston <tim@ed.am>
 
4
 * Copyright (C) 2009 to 2011 Tim Marston <tim@ed.am>
5
5
 *
6
6
 * This file is part of the Import Contacts program (hereafter referred
7
 
 * to as "this program").  For more information, see
 
7
 * to as "this program"). For more information, see
8
8
 * http://ed.am/dev/android/import-contacts
9
9
 *
10
10
 * This program is free software: you can redistribute it and/or modify
133
133
                        boolean in_vcard = false;
134
134
                        while( ( line = reader.readLine() ) != null )
135
135
                        {
136
 
                                if( !in_vcard )
137
 
                                {
 
136
                                if( !in_vcard ) {
138
137
                                        // look for vcard beginning
139
 
                                        if( line.matches( "(?i)BEGIN[ \t]*:[ \t]*VCARD.*" ) ) {
 
138
                                        if( line.matches( "^BEGIN:VCARD" ) ) {
140
139
                                                in_vcard = true;
141
140
                                                _vcard_count++;
142
141
                                        }
143
 
                                        // check for vMsg files
144
 
                                        else if( line.matches( "(?i)BEGIN[ \t]*:[ \t]*VMSG.*" ) ) {
145
 
                                                showError( getText( R.string.error_vcf_vmsgfile )
146
 
                                                        + file.getName() );
147
 
                                        }
148
142
                                }
149
 
                                else if( line.matches( "(?i)END[ \t]*:[ \t]*VCARD.*" ) )
 
143
                                else if( line.matches( "^END:VCARD" ) )
150
144
                                        in_vcard = false;
151
145
                        }
152
 
                        reader.close();
153
146
 
154
147
                }
155
148
                catch( FileNotFoundException e ) {
177
170
                        FileInputStream istream = new FileInputStream( file );
178
171
                        byte[] content = new byte[ (int)file.length() ];
179
172
                        istream.read( content );
180
 
                        istream.close();
 
173
                        istream = null;
181
174
 
182
175
                        // import
183
176
                        importVCardFileContent( content, file.getName() );
184
177
                }
185
 
                catch( OutOfMemoryError e ) {
186
 
                        showError( R.string.error_outofmemory );
187
 
                }
188
178
                catch( FileNotFoundException e ) {
189
179
                        showError( getText( R.string.error_filenotfound ) +
190
180
                                file.getName() );
203
193
                ContentLineIterator cli = new ContentLineIterator( content );
204
194
                while( cli.hasNext() )
205
195
                {
206
 
                        ContentLine content_line = cli.next();
 
196
                        ByteBuffer buffer = cli.next();
207
197
 
208
 
                        // get a US-ASCII version of the string, for processing
209
 
                        String line = content_line.getUsAsciiLine();
 
198
                        // get a US-ASCII version of the line for processing
 
199
                        String line;
 
200
                        try {
 
201
                                line = new String( buffer.array(), buffer.position(),
 
202
                                        buffer.limit() - buffer.position(), "US-ASCII" );
 
203
                        }
 
204
                        catch( UnsupportedEncodingException e ) {
 
205
                                // we know US-ASCII *is* supported, so appease the compiler...
 
206
                                line = "";
 
207
                        }
210
208
 
211
209
                        if( vcard == null ) {
212
210
                                // look for vcard beginning
213
 
                                if( line.matches( "(?i)BEGIN[ \t]*:[ \t]*VCARD.*" ) ) {
 
211
                                if( line.matches( "^BEGIN[ \t]*:[ \t]*VCARD" ) ) {
214
212
                                        setProgress( _progress++ );
215
213
                                        vcard = new Vcard();
216
214
                                        vcard_start_line = cli.getLineNumber();
218
216
                        }
219
217
                        else {
220
218
                                // look for vcard content or ending
221
 
                                if( line.matches( "(?i)END[ \t]*:[ \t]*VCARD.*" ) )
 
219
                                if( line.matches( "^END[ \t]*:[ \t]*VCARD" ) )
222
220
                                {
223
221
                                        // finalise the vcard/contact
224
222
                                        try {
261
259
                                {
262
260
                                        // try giving the line to the vcard
263
261
                                        try {
264
 
                                                vcard.parseLine( content_line );
 
262
                                                vcard.parseLine( buffer, line,
 
263
                                                        cli.doesNextLineLookFolded() );
265
264
                                        }
266
265
                                        catch( Vcard.ParseException e ) {
267
266
                                                skipContact();
274
273
                                                        finish( ACTION_ABORT );
275
274
                                                }
276
275
 
277
 
                                                // Although we're continuing, we still need to abort
278
 
                                                // this vCard.  Further lines will be ignored until we
 
276
                                                // although we're continuing, we still need to abort
 
277
                                                // this vCard. Further lines will be ignored until we
279
278
                                                // get to another BEGIN:VCARD line.
280
279
                                                vcard = null;
281
280
                                        }
282
281
                                        catch( Vcard.SkipImportException e ) {
283
282
                                                skipContact();
284
 
                                                // Abort this vCard.  Further lines will be ignored until
 
283
                                                // abort this vCard. Further lines will be ignored until
285
284
                                                // we get to another BEGIN:VCARD line.
286
285
                                                vcard = null;
287
286
                                        }
290
289
                }
291
290
        }
292
291
 
293
 
        class ContentLine
294
 
        {
295
 
                private ByteBuffer _buffer;
296
 
                private boolean _folded_next;
297
 
                private String _line;
298
 
 
299
 
                public ContentLine( ByteBuffer buffer, boolean folded_next )
300
 
                {
301
 
                        _buffer = buffer;
302
 
                        _folded_next = folded_next;
303
 
                        _line = null;
304
 
                }
305
 
 
306
 
                public ByteBuffer getBuffer()
307
 
                {
308
 
                        return _buffer;
309
 
                }
310
 
 
311
 
                public boolean doesNextLineLookFolded()
312
 
                {
313
 
                        return _folded_next;
314
 
                }
315
 
 
316
 
                public String getUsAsciiLine()
317
 
                {
318
 
                        // generated line and cache it
319
 
                        if( _line == null ) {
320
 
                                try {
321
 
                                        _line = new String( _buffer.array(), _buffer.position(),
322
 
                                                _buffer.limit() - _buffer.position(), "US-ASCII" );
323
 
                                }
324
 
                                catch( UnsupportedEncodingException e ) {
325
 
                                        // we know US-ASCII *is* supported, so appease the
326
 
                                        // compiler...
327
 
                                }
328
 
                        }
329
 
 
330
 
                        // return cached line
331
 
                        return _line;
332
 
                }
333
 
        }
334
 
 
335
 
        class ContentLineIterator implements Iterator< ContentLine >
 
292
        class ContentLineIterator implements Iterator< ByteBuffer >
336
293
        {
337
294
                protected byte[] _content = null;
338
295
                protected int _pos = 0;
350
307
                }
351
308
 
352
309
                @Override
353
 
                public ContentLine next()
 
310
                public ByteBuffer next()
354
311
                {
355
312
                        int initial_pos = _pos;
356
313
 
363
320
                                                _pos > initial_pos )? _pos - 1 : _pos;
364
321
                                        _pos++;
365
322
                                        _line++;
366
 
                                        return new ContentLine(
367
 
                                                ByteBuffer.wrap( _content, initial_pos,
368
 
                                                        to - initial_pos ),
369
 
                                                doesNextLineLookFolded() );
 
323
                                        return ByteBuffer.wrap( _content, initial_pos,
 
324
                                                to - initial_pos );
370
325
                                }
371
326
 
372
327
                        // we didn't find one, but were there bytes left?
374
329
                                int to = _pos;
375
330
                                _pos++;
376
331
                                _line++;
377
 
                                return new ContentLine(
378
 
                                        ByteBuffer.wrap( _content, initial_pos,
379
 
                                                to - initial_pos ),
380
 
                                        doesNextLineLookFolded() );
 
332
                                return ByteBuffer.wrap( _content, initial_pos,
 
333
                                        to - initial_pos );
381
334
                        }
382
335
 
383
336
                        // no bytes left
395
348
                 * onto the end of this one?
396
349
                 * @return
397
350
                 */
398
 
                private boolean doesNextLineLookFolded()
 
351
                public boolean doesNextLineLookFolded()
399
352
                {
400
353
                        return _pos > 0 && _pos < _content.length &&
401
354
                                _content[ _pos - 1 ] == '\n' &&
420
373
                private final static int MULTILINE_FOLDED = 3;  // MIME-DIR folding
421
374
 
422
375
                private String _version = null;
423
 
                private Vector< ContentLine > _content_lines = null;
 
376
                private Vector< ByteBuffer > _buffers = null;
424
377
                private int _name_level = NAMELEVEL_NONE;
425
378
                private int _parser_multiline_state = MULTILINE_NONE;
426
379
                private String _parser_current_name_and_params = null;
469
422
                @SuppressWarnings("serial")
470
423
                protected class SkipImportException extends Exception { }
471
424
 
472
 
                private String extractCollonPartFromLine( ContentLine content_line,
473
 
                        boolean former )
 
425
                private String extractCollonPartFromLine( ByteBuffer buffer,
 
426
                        String line, boolean former )
474
427
                {
 
428
                        String ret = null;
 
429
 
 
430
                        // get a US-ASCII version of the line for processing, unless we were
 
431
                        // supplied with one
 
432
                        if( line == null ) {
 
433
                                try {
 
434
                                        line = new String( buffer.array(), buffer.position(),
 
435
                                                buffer.limit() - buffer.position(), "US-ASCII" );
 
436
                                }
 
437
                                catch( UnsupportedEncodingException e ) {
 
438
                                        // we know US-ASCII is supported, so appease the compiler...
 
439
                                        line = "";
 
440
                                }
 
441
                        }
 
442
 
475
443
                        // split line into name and value parts and check to make sure we
476
444
                        // only got 2 parts and that the first part is not zero in length
477
 
                        String[] parts = content_line.getUsAsciiLine().split( ":", 2 );
 
445
                        String[] parts = line.split( ":", 2 );
478
446
                        if( parts.length == 2 && parts[ 0 ].length() > 0 )
479
 
                                return parts[ former? 0 : 1 ].trim();
480
 
 
481
 
                        return null;
482
 
                }
483
 
 
484
 
                private String extractNameAndParamsFromLine( ContentLine content_line )
485
 
                {
486
 
                        return extractCollonPartFromLine( content_line, true );
487
 
                }
488
 
 
489
 
                private String extractValueFromLine( ContentLine content_line )
490
 
                {
491
 
                        return extractCollonPartFromLine( content_line, false );
492
 
                }
493
 
 
494
 
                public void parseLine( ContentLine content_line )
 
447
                                ret = parts[ former? 0 : 1 ];
 
448
 
 
449
                        return ret;
 
450
                }
 
451
 
 
452
                private String extractNameAndParamsFromLine( ByteBuffer buffer,
 
453
                        String line )
 
454
                {
 
455
                        return extractCollonPartFromLine( buffer, line, true );
 
456
                }
 
457
 
 
458
                private String extractValueFromLine( ByteBuffer buffer, String line )
 
459
                {
 
460
                        return extractCollonPartFromLine( buffer, line, false );
 
461
                }
 
462
 
 
463
                public void parseLine( ByteBuffer buffer, String line,
 
464
                        boolean next_line_looks_folded )
495
465
                        throws ParseException, SkipImportException,
496
466
                        AbortImportException
497
467
                {
500
470
                        {
501
471
                                // tentatively get name and params from line
502
472
                                String name_and_params =
503
 
                                        extractNameAndParamsFromLine( content_line );
 
473
                                        extractNameAndParamsFromLine( buffer, line );
504
474
 
505
475
                                // is it a version line?
506
476
                                if( name_and_params != null &&
507
477
                                        name_and_params.equalsIgnoreCase( "VERSION" ) )
508
478
                                {
509
479
                                        // yes, get it!
510
 
                                        String value = extractValueFromLine( content_line );
511
 
                                        if( value == null || (
512
 
                                                !value.equals( "2.1" ) && !value.equals( "3.0" ) ) )
513
 
                                        {
 
480
                                        String value = extractValueFromLine( buffer, line );
 
481
                                        if( !value.equals( "2.1" ) && !value.equals( "3.0" ) )
514
482
                                                throw new ParseException( R.string.error_vcf_version );
515
 
                                        }
516
483
                                        _version = value;
517
484
 
518
485
                                        // parse any buffers we've been accumulating while we waited
519
486
                                        // for a version
520
 
                                        if( _content_lines != null )
521
 
                                                for( int i = 0; i < _content_lines.size(); i++ )
522
 
                                                        parseLine( _content_lines.get( i ) );
523
 
                                        _content_lines = null;
 
487
                                        if( _buffers != null )
 
488
                                                for( int i = 0; i < _buffers.size(); i++ )
 
489
                                                        parseLine( _buffers.get( i ), null,
 
490
                                                                i + 1 < _buffers.size() &&
 
491
                                                                _buffers.get( i + 1 ).hasRemaining() &&
 
492
                                                                _buffers.get( i + 1 ).get(
 
493
                                                                        _buffers.get( i + 1 ).position() ) == ' ' );
 
494
                                        _buffers = null;
524
495
                                }
525
496
                                else
526
497
                                {
527
498
                                        // no, so stash this line till we get a version
528
 
                                        if( _content_lines == null )
529
 
                                                _content_lines = new Vector< ContentLine >();
530
 
                                        _content_lines.add( content_line );
 
499
                                        if( _buffers == null )
 
500
                                                _buffers = new Vector< ByteBuffer >();
 
501
                                        _buffers.add( buffer );
531
502
                                }
532
503
                        }
533
504
                        else
545
516
 
546
517
                                        // skip some initial line characters, depending on the type
547
518
                                        // of multi-line we're handling
548
 
                                        pos = content_line.getBuffer().position();
 
519
                                        pos = buffer.position();
549
520
                                        switch( _parser_multiline_state )
550
521
                                        {
551
522
                                        case MULTILINE_FOLDED:
552
523
                                                pos++;
553
524
                                                break;
554
525
                                        case MULTILINE_ENCODED:
555
 
                                                while( pos < content_line.getBuffer().limit() && (
556
 
                                                        content_line.getBuffer().get( pos ) == ' ' ||
557
 
                                                        content_line.getBuffer().get( pos ) == '\t' ) )
 
526
                                                while( pos < buffer.limit() && (
 
527
                                                        buffer.get( pos ) == ' ' ||
 
528
                                                        buffer.get( pos ) == '\t' ) )
558
529
                                                {
559
530
                                                        pos++;
560
531
                                                }
570
541
                                else
571
542
                                {
572
543
                                        // skip empty lines
573
 
                                        if( content_line.getUsAsciiLine().trim().length() == 0 )
574
 
                                                return;
 
544
                                        if( line.trim().length() == 0 ) return;
575
545
 
576
546
                                        // get name and params from line, and since we're not
577
547
                                        // parsing a subsequent line in a multi-line, this should
578
548
                                        // not fail, or it's an error
579
549
                                        name_and_params =
580
 
                                                extractNameAndParamsFromLine( content_line );
 
550
                                                extractNameAndParamsFromLine( buffer, line );
581
551
                                        if( name_and_params == null )
582
552
                                                throw new ParseException(
583
553
                                                        R.string.error_vcf_malformed );
584
554
 
585
555
                                        // calculate how many chars to skip from beginning of line
586
556
                                        // so we skip the property "name:" part
587
 
                                        pos = content_line.getBuffer().position() +
588
 
                                                name_and_params.length() + 1;
 
557
                                        pos = buffer.position() + name_and_params.length() + 1;
589
558
 
590
559
                                        // reset the saved multi-line state
591
560
                                        _parser_current_name_and_params = name_and_params;
594
563
 
595
564
                                // get value from buffer, as raw bytes
596
565
                                ByteBuffer value;
597
 
                                value = ByteBuffer.wrap( content_line.getBuffer().array(), pos,
598
 
                                        content_line.getBuffer().limit() - pos );
 
566
                                value = ByteBuffer.wrap( buffer.array(), pos,
 
567
                                        buffer.limit() - pos );
599
568
 
600
569
                                // get parameter parts
601
570
                                String[] name_param_parts = name_and_params.split( ";", -1 );
689
658
                                // if we know we're not in an encoding-based multi-line, check
690
659
                                // to see if we're in a folded multi-line
691
660
                                if( _parser_multiline_state == MULTILINE_NONE &&
692
 
                                        content_line.doesNextLineLookFolded() )
 
661
                                        next_line_looks_folded )
693
662
                                {
694
663
                                        _parser_multiline_state = MULTILINE_FOLDED;
695
664
                                }
725
694
                                        parseLABEL( name_param_parts, complete_value );
726
695
                                else if( name_param_parts[ 0 ].equalsIgnoreCase( "NOTE" ) )
727
696
                                        parseNOTE( name_param_parts, complete_value );
728
 
                                else if( name_param_parts[ 0 ].equalsIgnoreCase( "BDAY" ) )
729
 
                                        parseBDAY( name_param_parts, complete_value );
730
697
                        }
731
698
                }
732
699
 
756
723
                        {
757
724
                                String str = parts.get( a );
758
725
 
759
 
                                // Look for parts that end in an escape character, but ignore
760
 
                                // the final part.  We've already detected escape chars at the
 
726
                                // look for parts that end in an escape character, but ignore
 
727
                                // the final part. We've already detected escape chars at the
761
728
                                // end of the final part in parseLine() and handled multi-lines
762
729
                                // accordingly.
763
730
                                if( a < parts.size() - 1 &&
853
820
                                        for( int b = 0; b < name_part_parts.length; b++ )
854
821
                                                if( name_part_parts[ b ].length() > 0 )
855
822
                                                {
856
 
                                                        if( value.length() > 0 ) value += " ";
 
823
                                                        if( value.length() == 0 ) value += " ";
857
824
                                                        value += name_part_parts[ b ];
858
825
                                                }
859
826
                                }
1033
1000
                        addNote( unescapeValue( value ) );
1034
1001
                }
1035
1002
 
1036
 
                private void parseBDAY( String[] params, String value )
1037
 
                {
1038
 
                        setBirthday( value );
1039
 
                }
1040
 
 
1041
1003
                public void finaliseVcard()
1042
1004
                        throws ParseException, ContactNotIdentifiableException
1043
1005
                {
1044
1006
                        // missing version (and data is present)
1045
 
                        if( _version == null && _content_lines != null )
 
1007
                        if( _version == null && _buffers != null )
1046
1008
                                throw new ParseException( R.string.error_vcf_malformed );
1047
1009
 
1048
1010
                        // finalise the parent class
1051
1013
 
1052
1014
                /**
1053
1015
                 * Amongst the params, find the value of only the first of any with
1054
 
                 * the specified name.
1055
 
                 *
 
1016
                 * the specified name
1056
1017
                 * @param params
1057
1018
                 * @param name
1058
1019
                 * @return a value, or null
1064
1025
                }
1065
1026
 
1066
1027
                /**
1067
 
                 * Amongst the params, find the values of any with the specified name.
1068
 
                 *
 
1028
                 * Amongst the params, find the values of any with the specified name
1069
1029
                 * @param params
1070
1030
                 * @param name
1071
1031
                 * @return an array of values, or null
1087
1047
                }
1088
1048
 
1089
1049
                /**
1090
 
                 * Amongst the params, return any type values present.  For v2.1 vCards,
1091
 
                 * those types are just parameters.  For v3.0, they are prefixed with
1092
 
                 * "TYPE=".  There may also be multiple type parameters.
1093
 
                 *
 
1050
                 * Amongst the params, return any type values present. For v2.1 vCards,
 
1051
                 * those types are just parameters. For v3.0, they are prefixed with
 
1052
                 * "TYPE=". There may also be multiple type parameters.
1094
1053
                 * @param params an array of params to look for types in
1095
1054
                 * @param valid_types a list of upper-case type values to look for
1096
1055
                 * @return a set of present type values
1148
1107
                                else if( ch == '=' && i == in.limit() - 1 )
1149
1108
                                {
1150
1109
                                        // we found a '=' at the end of a line signifying a multi-
1151
 
                                        // line string, so we don't add it
 
1110
                                        // line string, so we don't add it.
1152
1111
                                        another = true;
1153
1112
                                        continue;
1154
1113
                                }