/android/import-contacts

To get this branch, use:
bzr branch http://bzr.ed.am/android/import-contacts

« back to all changes in this revision

Viewing changes to src/org/waxworlds/edam/importcontacts/VCFImporter.java

  • Committer: edam
  • Date: 2011-05-02 18:28:24 UTC
  • Revision ID: edam@waxworlds.org-20110502182824-acgdi3qfxfzqgely
- fixed logic for vcard field types (home, work, cell, etc) so it works
- updated NEWS and TODO
- rewrote most of ContactsCache, including a new ContactIdentifier class to identify contacts in the cache and new cache building code
- contacts now identified in the same way that Android displays them (by name, or organisation, or number, or email, in that order)
- proper handling and support for organisations and titles
- validation of imported contact now done by Importer, not VcfImporter
- separated sanitisation and normalisation (for cache lookups)
- generalised PhoneData, EmailData and AddressData classes
- ContactData is now aware of primary numbers, emails and organisations (defaults to the first preferred one seen, or the first one seen where none is preferred)

Show diffs side-by-side

added added

removed removed

1
1
/*
2
2
 * VCFImporter.java
3
3
 *
4
 
 * Copyright (C) 2009 Tim Marston <edam@waxworlds.org>
 
4
 * Copyright (C) 2009 to 2011 Tim Marston <edam@waxworlds.org>
5
5
 *
6
6
 * This file is part of the Import Contacts program (hereafter referred
7
7
 * to as "this program"). For more information, see
25
25
 
26
26
import java.io.BufferedReader;
27
27
import java.io.File;
 
28
import java.io.FileInputStream;
28
29
import java.io.FileNotFoundException;
29
30
import java.io.FileReader;
30
31
import java.io.FilenameFilter;
31
32
import java.io.IOException;
32
33
import java.io.UnsupportedEncodingException;
 
34
import java.nio.ByteBuffer;
 
35
import java.util.ArrayList;
33
36
import java.util.Arrays;
 
37
import java.util.HashMap;
34
38
import java.util.HashSet;
 
39
import java.util.Iterator;
35
40
import java.util.List;
 
41
import java.util.NoSuchElementException;
36
42
import java.util.Set;
37
43
import java.util.Vector;
38
44
import java.util.regex.Matcher;
39
45
import java.util.regex.Pattern;
40
46
 
 
47
import org.waxworlds.edam.importcontacts.Importer.ContactData.ExtraDetail;
 
48
 
41
49
import android.content.SharedPreferences;
42
50
import android.provider.Contacts;
43
51
import android.provider.Contacts.PhonesColumns;
118
126
                {
119
127
                        // open file
120
128
                        BufferedReader reader = new BufferedReader(
121
 
                                        new FileReader( file ) );
 
129
                                new FileReader( file ) );
122
130
 
123
131
                        // read
124
132
                        String line;
127
135
                        {
128
136
                                if( !inVCard ) {
129
137
                                        // look for vcard beginning
130
 
                                        if( line.matches( "^BEGIN[ \\t]*:[ \\t]*VCARD" ) ) {
 
138
                                        if( line.matches( "^BEGIN:VCARD" ) ) {
131
139
                                                inVCard = true;
132
140
                                                _vCardCount++;
133
141
                                        }
134
142
                                }
135
 
                                else if( line.matches( "^END[ \\t]*:[ \\t]*VCARD" ) )
 
143
                                else if( line.matches( "^END:VCARD" ) )
136
144
                                        inVCard = false;
137
145
                        }
138
146
 
148
156
 
149
157
        private void importVCardFile( File file ) throws AbortImportException
150
158
        {
 
159
                // check file is good
 
160
                if( !file.exists() )
 
161
                        showError( getText( R.string.error_filenotfound ) +
 
162
                                file.getName() );
 
163
                if( file.length() == 0 )
 
164
                        showError( getText( R.string.error_fileisempty ) +
 
165
                                file.getName() );
 
166
 
151
167
                try
152
168
                {
153
 
                        // open file
154
 
                        BufferedReader reader = new BufferedReader(
155
 
                                        new FileReader( file ) );
156
 
 
157
 
                        // read
158
 
                        StringBuffer content = new StringBuffer();
159
 
                        String line;
160
 
                        while( ( line = reader.readLine() ) != null )
161
 
                                content.append( line ).append( "\n" );
162
 
 
163
 
                        importVCardFileContent( content.toString(), file.getName() );
 
169
                        // open/read file
 
170
                        FileInputStream istream = new FileInputStream( file );
 
171
                        byte[] content = new byte[ (int)file.length() ];
 
172
                        istream.read( content );
 
173
 
 
174
                        // import
 
175
                        importVCardFileContent( content, file.getName() );
164
176
                }
165
177
                catch( FileNotFoundException e ) {
166
178
                        showError( getText( R.string.error_filenotfound ) +
171
183
                }
172
184
        }
173
185
 
174
 
        private void importVCardFileContent( String content, String fileName )
175
 
                        throws AbortImportException
 
186
        private void importVCardFileContent( byte[] content, String fileName )
 
187
                throws AbortImportException
176
188
        {
177
 
                // get lines and parse them
178
 
                String[] lines = content.split( "\n" );
 
189
                // go through lines
179
190
                VCard vCard = null;
180
 
                for( int i = 0; i < lines.length; i++ )
 
191
                ContentLineIterator cli = new ContentLineIterator( content );
 
192
                while( cli.hasNext() )
181
193
                {
182
 
                        String line = lines[ i ];
 
194
                        ByteBuffer buffer = cli.next();
 
195
 
 
196
                        // get a US-ASCII version of the line for processing
 
197
                        String line;
 
198
                        try {
 
199
                                line = new String( buffer.array(), buffer.position(),
 
200
                                        buffer.limit() - buffer.position(), "US-ASCII" );
 
201
                        }
 
202
                        catch( UnsupportedEncodingException e ) {
 
203
                                // we know US-ASCII is supported, so appease the compiler...
 
204
                                line = "";
 
205
                        }
183
206
 
184
207
                        if( vCard == null ) {
185
208
                                // look for vcard beginning
186
 
                                if( line.matches( "^BEGIN[ \\t]*:[ \\t]*VCARD" ) ) {
 
209
                                if( line.matches( "^BEGIN:VCARD" ) ) {
187
210
                                        setProgress( ++_progress );
188
211
                                        vCard = new VCard();
189
212
                                }
190
213
                        }
191
214
                        else {
192
215
                                // look for vcard content or ending
193
 
                                if( line.matches( "^END[ \\t]*:[ \\t]*VCARD" ) )
 
216
                                if( line.matches( "^END:VCARD" ) )
194
217
                                {
195
218
                                        // store vcard and do away with it
196
219
                                        try {
200
223
                                        catch( VCard.ParseException e ) {
201
224
                                                skipContact();
202
225
                                                if( !showContinue(
203
 
                                                                getText( R.string.error_vcf_parse ).toString()
204
 
                                                                + fileName + "\n" + e.getMessage() ) )
 
226
                                                        getText( R.string.error_vcf_parse ).toString()
 
227
                                                        + fileName + "\n" + e.getMessage() ) )
 
228
                                                {
205
229
                                                        finish( ACTION_ABORT );
 
230
                                                }
206
231
                                        }
207
232
                                        catch( VCard.SkipContactException e ) {
208
233
                                                skipContact();
214
239
                                {
215
240
                                        // try giving the line to the vcard
216
241
                                        try {
217
 
                                                vCard.parseLine( line );
 
242
                                                vCard.parseLine( buffer, line,
 
243
                                                        cli.doesNextLineLookFolded() );
218
244
                                        }
219
245
                                        catch( VCard.ParseException e ) {
220
246
                                                skipContact();
221
247
                                                if( !showContinue(
222
 
                                                                getText( R.string.error_vcf_parse ).toString()
223
 
                                                                + fileName + "\n" + e.getMessage() ) )
 
248
                                                        getText( R.string.error_vcf_parse ).toString()
 
249
                                                        + fileName + "\n" + e.getMessage() ) )
 
250
                                                {
224
251
                                                        finish( ACTION_ABORT );
 
252
                                                }
225
253
 
226
254
                                                // although we're continuing, we still need to abort
227
255
                                                // this vCard. Further lines will be ignored until we
239
267
                }
240
268
        }
241
269
 
 
270
        class ContentLineIterator implements Iterator< ByteBuffer >
 
271
        {
 
272
                protected byte[] _content = null;
 
273
                protected int _pos = 0;
 
274
 
 
275
                public ContentLineIterator( byte[] content )
 
276
                {
 
277
                        _content = content;
 
278
                }
 
279
 
 
280
                @Override
 
281
                public boolean hasNext()
 
282
                {
 
283
                        return _pos < _content.length;
 
284
                }
 
285
 
 
286
                @Override
 
287
                public ByteBuffer next()
 
288
                {
 
289
                        int initial_pos = _pos;
 
290
 
 
291
                        // find newline
 
292
                        for( ; _pos < _content.length; _pos++ )
 
293
                                if( _content[ _pos ] == '\n' )
 
294
                                {
 
295
                                        // adjust for a \r preceding the \n
 
296
                                        int to = ( _pos > 0 && _content[ _pos - 1 ] == '\r' &&
 
297
                                                _pos > initial_pos )? _pos - 1 : _pos;
 
298
                                        _pos++;
 
299
                                        return ByteBuffer.wrap( _content, initial_pos,
 
300
                                                to - initial_pos );
 
301
                                }
 
302
 
 
303
                        // we didn't find one, but were there bytes left?
 
304
                        if( _pos != initial_pos ) {
 
305
                                int to = _pos;
 
306
                                _pos++;
 
307
                                return ByteBuffer.wrap( _content, initial_pos,
 
308
                                        to - initial_pos );
 
309
                        }
 
310
 
 
311
                        // no bytes left
 
312
                        throw new NoSuchElementException();
 
313
                }
 
314
 
 
315
                @Override
 
316
                public void remove()
 
317
                {
 
318
                        throw new UnsupportedOperationException();
 
319
                }
 
320
 
 
321
                /**
 
322
                 * Does the next line, if there is one, look like it should be folded
 
323
                 * onto the end of this one?
 
324
                 * @return
 
325
                 */
 
326
                public boolean doesNextLineLookFolded()
 
327
                {
 
328
                        return _pos > 0 && _pos < _content.length &&
 
329
                                _content[ _pos - 1 ] == '\n' && _content[ _pos ] == ' ';
 
330
                }
 
331
        }
 
332
 
242
333
        private class VCard extends ContactData
243
334
        {
244
335
                private final static int NAMELEVEL_NONE = 0;
245
 
                private final static int NAMELEVEL_ORG = 1;
246
 
                private final static int NAMELEVEL_FN = 2;
247
 
                private final static int NAMELEVEL_N = 3;
 
336
                private final static int NAMELEVEL_FN = 1;
 
337
                private final static int NAMELEVEL_N = 2;
 
338
 
 
339
                private final static int MULTILINE_NONE = 0;
 
340
                private final static int MULTILINE_ENCODED = 1; // v2.1 quoted-printable
 
341
                private final static int MULTILINE_ESCAPED = 2; // v2.1 \\CRLF
 
342
                private final static int MULTILINE_FOLDED = 3;  // v3.0 folding
248
343
 
249
344
                private String _version = null;
250
 
                private Vector< String > _lines = null;
 
345
                private Vector< ByteBuffer > _buffers = null;
251
346
                private int _name_level = NAMELEVEL_NONE;
252
 
                private boolean _parser_in_multiline = false;
 
347
                private int _parser_multiline_state = MULTILINE_NONE;
253
348
                private String _parser_current_name_and_params = null;
254
349
                private String _parser_buffered_value_so_far = "";
 
350
                private String _cached_organisation = null;
 
351
                private String _cached_title = null;
255
352
 
256
353
                protected class UnencodeResult
257
354
                {
258
355
                        private boolean _another_line_required;
259
 
                        private byte[] _bytes;
260
 
                        private int _num_bytes;
 
356
                        private ByteBuffer _buffer;
261
357
 
262
 
                        public UnencodeResult( boolean another_line_required, byte[] bytes,
263
 
                                int num_bytes )
 
358
                        public UnencodeResult( boolean another_line_required,
 
359
                                ByteBuffer buffer )
264
360
                        {
265
361
                                _another_line_required = another_line_required;
266
 
                                _bytes = bytes;
267
 
                                _num_bytes = num_bytes;
 
362
                                _buffer = buffer;
268
363
                        }
269
364
 
270
365
                        public boolean isAnotherLineRequired()
272
367
                                return _another_line_required;
273
368
                        }
274
369
 
275
 
                        public byte[] getBytes()
276
 
                        {
277
 
                                return _bytes;
278
 
                        }
279
 
 
280
 
                        public int getNumBytes()
281
 
                        {
282
 
                                return _num_bytes;
 
370
                        public ByteBuffer getBuffer()
 
371
                        {
 
372
                                return _buffer;
283
373
                        }
284
374
                }
285
375
 
301
391
                @SuppressWarnings("serial")
302
392
                protected class SkipContactException extends Exception { }
303
393
 
304
 
                public void parseLine( String line )
305
 
                                throws ParseException, SkipContactException,
306
 
                                AbortImportException
307
 
                {
308
 
                        // ignore empty lines
309
 
                        if( line.trim() == "" ) return;
310
 
 
311
 
                        // split line into name and value parts (this may turn out to be
312
 
                        // unwanted if the line is a subsequent line in a multi-line
313
 
                        // value, but we have to do this now to check for and handle VCF
314
 
                        // versions first)
315
 
                        String[] props = line.split(  ":", 2 );
316
 
                        for( int i = 0; i < props.length; i++ )
317
 
                                props[ i ] = props[ i ].trim();
318
 
 
319
 
                        // if we haven't yet got a version, we won't be paring anything!
 
394
                private String extractCollonPartFromLine( ByteBuffer buffer,
 
395
                        String line, boolean former )
 
396
                {
 
397
                        String ret = null;
 
398
 
 
399
                        // get a US-ASCII version of the line for processing, unless we were
 
400
                        // supplied with one
 
401
                        if( line == null ) {
 
402
                                try {
 
403
                                        line = new String( buffer.array(), buffer.position(),
 
404
                                                buffer.limit() - buffer.position(), "US-ASCII" );
 
405
                                }
 
406
                                catch( UnsupportedEncodingException e ) {
 
407
                                        // we know US-ASCII is supported, so appease the compiler...
 
408
                                        line = "";
 
409
                                }
 
410
                        }
 
411
 
 
412
                        // split line into name and value parts and check to make sure we
 
413
                        // only got 2 parts and that the first part is not zero in length
 
414
                        String[] parts = line.split( ":", 2 );
 
415
                        if( parts.length == 2 && parts[ 0 ].length() > 0 )
 
416
                                ret = parts[ former? 0 : 1 ];
 
417
 
 
418
                        return ret;
 
419
                }
 
420
 
 
421
                private String extractNameAndParamsFromLine( ByteBuffer buffer,
 
422
                        String line )
 
423
                {
 
424
                        return extractCollonPartFromLine( buffer, line, true );
 
425
                }
 
426
 
 
427
                private String extractValueFromLine( ByteBuffer buffer, String line )
 
428
                {
 
429
                        return extractCollonPartFromLine( buffer, line, false );
 
430
                }
 
431
 
 
432
                public void parseLine( ByteBuffer buffer, String line,
 
433
                        boolean next_line_looks_folded )
 
434
                        throws ParseException, SkipContactException,
 
435
                        AbortImportException
 
436
                {
 
437
                        // do we have a version yet?
320
438
                        if( _version == null )
321
439
                        {
322
 
                                // is this a version?
323
 
                                if( props.length == 2 && props[ 0 ].equals( "VERSION" ) )
 
440
                                // tentatively get name and params from line
 
441
                                String name_and_params =
 
442
                                        extractNameAndParamsFromLine( buffer, line );
 
443
 
 
444
                                // is it a version line?
 
445
                                if( name_and_params != null &&
 
446
                                        name_and_params.equals( "VERSION" ) )
324
447
                                {
325
 
                                        // yes, check/store it
326
 
                                        if( !props[ 1 ].equals( "2.1" ) &&
327
 
                                                        !props[ 1 ].equals( "3.0" ) )
 
448
                                        // yes, get it!
 
449
                                        String value = extractValueFromLine( buffer, line );
 
450
                                        if( !value.equals( "2.1" ) && !value.equals( "3.0" ) )
328
451
                                                throw new ParseException( R.string.error_vcf_version );
329
 
                                        _version = props[ 1 ];
 
452
                                        _version = value;
330
453
 
331
 
                                        // parse any other lines we've accumulated so far
332
 
                                        if( _lines != null )
333
 
                                                for( int i = 0; i < _lines.size(); i++ )
334
 
                                                        parseLine( _lines.get( i ) );
335
 
                                        _lines = null;
 
454
                                        // parse any buffers we've been accumulating while we waited
 
455
                                        // for a version
 
456
                                        if( _buffers != null )
 
457
                                                for( int i = 0; i < _buffers.size(); i++ )
 
458
                                                        parseLine( _buffers.get( i ), null,
 
459
                                                                i + 1 < _buffers.size() &&
 
460
                                                                _buffers.get( i + 1 ).hasRemaining() &&
 
461
                                                                _buffers.get( i + 1 ).get(
 
462
                                                                        _buffers.get( i + 1 ).position() ) == ' ' );
 
463
                                        _buffers = null;
336
464
                                }
337
465
                                else
338
466
                                {
339
 
                                        // no, so stash this line till we have a version
340
 
                                        if( _lines == null )
341
 
                                                _lines = new Vector< String >();
342
 
                                        _lines.add( line );
 
467
                                        // no, so stash this line till we get a version
 
468
                                        if( _buffers == null )
 
469
                                                _buffers = new Vector< ByteBuffer >();
 
470
                                        _buffers.add( buffer );
343
471
                                }
344
472
                        }
345
473
                        else
346
474
                        {
347
 
                                if( _parser_in_multiline )
 
475
                                // name and params and the position in the buffer where the
 
476
                                // "value" part of the line start
 
477
                                String name_and_params;
 
478
                                int pos;
 
479
 
 
480
                                if( _parser_multiline_state != MULTILINE_NONE )
348
481
                                {
349
482
                                        // if we're currently in a multi-line value, use the stored
350
483
                                        // property name and parameters
351
 
                                        props = new String[ 2 ];
352
 
                                        props[ 0 ] = _parser_current_name_and_params;
353
 
                                        props[ 1 ] = line.trim();
 
484
                                        name_and_params = _parser_current_name_and_params;
 
485
 
 
486
                                        // skip some initial line characters, depending on the type
 
487
                                        // of multi-line we're handling
 
488
                                        pos = buffer.position();
 
489
                                        switch( _parser_multiline_state )
 
490
                                        {
 
491
                                        case MULTILINE_FOLDED:
 
492
                                                pos++;
 
493
                                                break;
 
494
                                        case MULTILINE_ENCODED:
 
495
                                                while( pos < buffer.limit() && (
 
496
                                                        buffer.get( pos ) == ' ' ||
 
497
                                                        buffer.get( pos ) == '\t' ) )
 
498
                                                {
 
499
                                                        pos++;
 
500
                                                }
 
501
                                                break;
 
502
                                        default:
 
503
                                                // do nothing
 
504
                                        }
 
505
 
 
506
                                        // take us out of multi-line so that we can re-detect that
 
507
                                        // this line is a multi-line or not
 
508
                                        _parser_multiline_state = MULTILINE_NONE;
354
509
                                }
355
510
                                else
356
511
                                {
357
 
                                        // for normal lines, check the property name/value bits
358
 
                                        if( props.length < 2 || props[ 0 ].length() == 0 )
 
512
                                        // get name and params from line, and since we're not
 
513
                                        // parsing a subsequent line in a multi-line, this should
 
514
                                        // not fail, or it's an error
 
515
                                        name_and_params =
 
516
                                                extractNameAndParamsFromLine( buffer, line );
 
517
                                        if( name_and_params == null )
359
518
                                                throw new ParseException(
360
519
                                                        R.string.error_vcf_malformed );
361
520
 
362
 
                                        // ignore empty properties
363
 
                                        if( props[ 1 ].length() < 1 )
364
 
                                                return;
 
521
                                        // calculate how many chars to skip from beginning of line
 
522
                                        // so we skip the property "name:" part
 
523
                                        pos = buffer.position() + name_and_params.length() + 1;
365
524
 
366
525
                                        // reset the saved multi-line state
367
 
                                        _parser_current_name_and_params = props[ 0 ];
 
526
                                        _parser_current_name_and_params = name_and_params;
368
527
                                        _parser_buffered_value_so_far = "";
369
528
                                }
370
529
 
 
530
                                // get value from buffer, as raw bytes
 
531
                                ByteBuffer value;
 
532
                                value = ByteBuffer.wrap( buffer.array(), pos,
 
533
                                        buffer.limit() - pos );
 
534
 
371
535
                                // get parameter parts
372
 
                                String[] params = props[ 0 ].split( ";" );
373
 
                                for( int i = 0; i < params.length; i++ )
374
 
                                        params[ i ] = params[ i ].trim();
 
536
                                String[] name_param_parts = name_and_params.split( ";", -1 );
 
537
                                for( int i = 0; i < name_param_parts.length; i++ )
 
538
                                        name_param_parts[ i ] = name_param_parts[ i ].trim();
375
539
 
376
 
                                // parse charset and encoding parameters
377
 
                                String charset, encoding;
378
 
                                if( ( charset = checkParam( params, "CHARSET" ) ) != null &&
379
 
                                        !charset.equals( "UTF-8" ) && !charset.equals( "UTF-16" ) )
380
 
                                {
381
 
                                        throw new ParseException( R.string.error_vcf_charset );
382
 
                                }
383
 
                                if( ( encoding = checkParam( params, "ENCODING" ) ) != null &&
384
 
                                        !encoding.equals( "QUOTED-PRINTABLE" ) &&
385
 
                                        !encoding.equals( "8BIT" ) )
 
540
                                // parse encoding parameter
 
541
                                String encoding = checkParam( name_param_parts, "ENCODING" );
 
542
                                if( encoding != null ) encoding = encoding.toUpperCase();
 
543
                                if( encoding != null && !encoding.equals( "8BIT" ) &&
 
544
                                        !encoding.equals( "QUOTED-PRINTABLE" ) )
386
545
                                        //&& !encoding.equals( "BASE64" ) )
387
546
                                {
388
547
                                        throw new ParseException( R.string.error_vcf_encoding );
389
548
                                }
390
549
 
 
550
                                // parse charset parameter
 
551
                                String charset = checkParam( name_param_parts, "CHARSET" );
 
552
                                if( charset != null ) charset = charset.toUpperCase();
 
553
                                if( charset != null && !charset.equals( "US-ASCII" ) &&
 
554
                                        !charset.equals( "ASCII" ) &&
 
555
                                        !charset.equals( "UTF-8" ) )
 
556
                                {
 
557
                                        throw new ParseException( R.string.error_vcf_charset );
 
558
                                }
 
559
 
391
560
                                // do unencoding (or default to a fake unencoding result with
392
561
                                // the raw string)
393
 
                                UnencodeResult result;
 
562
                                UnencodeResult unencoding_result = null;
394
563
                                if( encoding != null && encoding.equals( "QUOTED-PRINTABLE" ) )
395
 
                                        result = unencodeQuotedPrintable( props[ 1 ], charset );
 
564
                                        unencoding_result = unencodeQuotedPrintable( value );
396
565
//                              else if( encoding != null && encoding.equals( "BASE64" ) )
397
 
//                                      result = unencodeBase64( props[ 1 ], charset );
398
 
                                else
399
 
                                        result = new UnencodeResult( false, props[ 1 ].getBytes(),
400
 
                                                props[ 1 ].getBytes().length );
 
566
//                                      unencoding_result = unencodeBase64( props[ 1 ], charset );
 
567
                                if( unencoding_result != null ) {
 
568
                                        value = unencoding_result.getBuffer();
 
569
                                        if( unencoding_result.isAnotherLineRequired() )
 
570
                                                _parser_multiline_state = MULTILINE_ENCODED;
 
571
                                }
 
572
 
 
573
                                // convert 8-bit ASCII charset to US-ASCII
 
574
                                if( charset == null || charset.equals( "ASCII" ) ) {
 
575
                                        value = transcodeAsciiToUtf8( value );
 
576
                                        charset = "UTF-8";
 
577
                                }
401
578
 
402
579
                                // process charset
 
580
                                String string_value;
403
581
                                try {
404
 
                                        props[ 1 ] = new String( result.getBytes(), 0,
405
 
                                                result.getNumBytes(),
406
 
                                                charset == null? "UTF-8" : charset );
 
582
                                        string_value = new String( value.array(), value.position(),
 
583
                                                value.limit() - value.position(), charset );
407
584
                                } catch( UnsupportedEncodingException e ) {
408
585
                                        throw new ParseException( R.string.error_vcf_charset );
409
586
                                }
410
587
 
411
 
                                // handle multi-line requests
412
 
                                _parser_in_multiline = result.isAnotherLineRequired();
413
 
                                if( _parser_in_multiline ) {
414
 
                                        _parser_buffered_value_so_far += props[ 1 ];
 
588
                                // for some entries that have semicolon-separated value parts,
 
589
                                // check to see if the value ends in an escape character, which
 
590
                                // indicates that we have a multi-line value
 
591
                                if( ( name_param_parts[ 0 ].equals( "N" ) ||
 
592
                                        name_param_parts[ 0 ].equals( "ORG" ) ||
 
593
                                        name_param_parts[ 0 ].equals( "ADR" ) ) &&
 
594
                                        doesStringEndInAnEscapeChar( string_value ) )
 
595
                                {
 
596
                                        _parser_multiline_state = MULTILINE_ESCAPED;
 
597
                                        string_value = string_value.substring( 0,
 
598
                                                string_value.length() - 1 );
 
599
                                }
 
600
 
 
601
                                // now we know whether we're in an encoding multi-line,
 
602
                                // determine if we're in a v3 folded multi-line or not
 
603
                                if( _parser_multiline_state == MULTILINE_NONE &&
 
604
                                        _version.equals( "3.0" ) && next_line_looks_folded )
 
605
                                {
 
606
                                        _parser_multiline_state = MULTILINE_FOLDED;
 
607
                                }
 
608
 
 
609
                                // handle multi-lines by buffering them and parsing them when we
 
610
                                // are processing the last line in a multi-line sequence
 
611
                                if( _parser_multiline_state != MULTILINE_NONE ) {
 
612
                                        _parser_buffered_value_so_far += string_value;
415
613
                                        return;
416
614
                                }
 
615
                                String complete_value =
 
616
                                        ( _parser_buffered_value_so_far + string_value ).trim();
417
617
 
418
 
                                // add on buffered multi-line content
419
 
                                String value = _parser_buffered_value_so_far + props[ 1 ];
 
618
                                // ignore empty values
 
619
                                if( complete_value.length() < 1 ) return;
420
620
 
421
621
                                // parse some properties
422
 
                                if( params[ 0 ].equals( "N" ) )
423
 
                                        parseN( params, value );
424
 
                                else if( params[ 0 ].equals( "FN" ) )
425
 
                                        parseFN( params, value );
426
 
                                else if( params[ 0 ].equals( "ORG" ) )
427
 
                                        parseORG( params, value );
428
 
                                else if( params[ 0 ].equals( "TEL" ) )
429
 
                                        parseTEL( params, value );
430
 
                                else if( params[ 0 ].equals( "EMAIL" ) )
431
 
                                        parseEMAIL( params, value );
432
 
                        }
 
622
                                if( name_param_parts[ 0 ].equals( "N" ) )
 
623
                                        parseN( name_param_parts, complete_value );
 
624
                                else if( name_param_parts[ 0 ].equals( "FN" ) )
 
625
                                        parseFN( name_param_parts, complete_value );
 
626
                                else if( name_param_parts[ 0 ].equals( "ORG" ) )
 
627
                                        parseORG( name_param_parts, complete_value );
 
628
                                else if( name_param_parts[ 0 ].equals( "TITLE" ) )
 
629
                                        parseTITLE( name_param_parts, complete_value );
 
630
                                else if( name_param_parts[ 0 ].equals( "TEL" ) )
 
631
                                        parseTEL( name_param_parts, complete_value );
 
632
                                else if( name_param_parts[ 0 ].equals( "EMAIL" ) )
 
633
                                        parseEMAIL( name_param_parts, complete_value );
 
634
                                else if( name_param_parts[ 0 ].equals( "ADR" ) )
 
635
                                        parseADR( name_param_parts, complete_value );
 
636
                        }
 
637
                }
 
638
 
 
639
                private boolean doesStringEndInAnEscapeChar( String string )
 
640
                {
 
641
                        // count the number of backslashes at the end of the string
 
642
                        int count = 0;
 
643
                        for( int a = string.length() - 1; a >= 0; a-- )
 
644
                                if( string.charAt( a ) == '\\' )
 
645
                                        count++;
 
646
                                else
 
647
                                        break;
 
648
 
 
649
                        // if there are an even number of backslashes then the final one
 
650
                        // doesn't count
 
651
                        return ( count & 1 ) == 1;
 
652
                }
 
653
 
 
654
                private String[] splitValueBySemicolon( String value )
 
655
                {
 
656
                        // split string in to parts by semicolon
 
657
                        ArrayList< String > parts = new ArrayList< String >(
 
658
                                Arrays.asList( value.split(  ";" ) ) );
 
659
 
 
660
                        // go through parts
 
661
                        for( int a = 0; a < parts.size(); a++ )
 
662
                        {
 
663
                                String str = parts.get( a );
 
664
 
 
665
                                // look for parts that end in an escape character, but ignore
 
666
                                // the final part. We've already detected escape chars at the
 
667
                                // end of the final part in parseLine() and handled multi-lines
 
668
                                // accordingly.
 
669
                                if( a < parts.size() - 1 &&
 
670
                                        doesStringEndInAnEscapeChar( str ) )
 
671
                                {
 
672
                                        // join the next part to this part and remove the next part
 
673
                                        parts.set( a, str.substring( 0, str.length() - 1 ) +
 
674
                                                ';' + parts.get( a + 1 ) );
 
675
                                        parts.remove( a + 1 );
 
676
 
 
677
                                        // re-visit this part
 
678
                                        a--;
 
679
                                        continue;
 
680
                                }
 
681
 
 
682
                                // trim and replace string
 
683
                                str = str.trim();
 
684
                                parts.set( a, str );
 
685
                        }
 
686
 
 
687
                        String[] ret = new String[ parts.size() ];
 
688
                        return parts.toArray( ret );
433
689
                }
434
690
 
435
691
                private void parseN( String[] params, String value )
436
 
                                throws ParseException, SkipContactException,
437
 
                                AbortImportException
438
692
                {
439
693
                        // already got a better name?
440
694
                        if( _name_level >= NAMELEVEL_N ) return;
441
695
 
442
696
                        // get name parts
443
 
                        String[] nameparts = value.split( ";" );
444
 
                        for( int i = 0; i < nameparts.length; i++ )
445
 
                                nameparts[ i ] = nameparts[ i ].trim();
 
697
                        String[] name_parts = splitValueBySemicolon( value );
446
698
 
447
699
                        // build name
448
700
                        value = "";
449
 
                        if( nameparts.length > 1 && nameparts[ 1 ].length() > 0 )
450
 
                                value += nameparts[ 1 ];
451
 
                        if( nameparts[ 0 ].length() > 0 )
452
 
                                value += ( value.length() == 0? "" : " " ) + nameparts[ 0 ];
 
701
                        if( name_parts.length > 1 && name_parts[ 1 ].length() > 0 )
 
702
                                value += name_parts[ 1 ];
 
703
                        if( name_parts.length > 0 && name_parts[ 0 ].length() > 0 )
 
704
                                value += ( value.length() == 0? "" : " " ) + name_parts[ 0 ];
453
705
 
454
706
                        // set name
455
707
                        setName( value );
456
708
                        _name_level = NAMELEVEL_N;
457
 
 
458
 
                        // check now to see if we need to import this contact (to avoid
459
 
                        // parsing the rest of the vCard unnecessarily)
460
 
                        if( !isImportRequired( getName() ) )
461
 
                                throw new SkipContactException();
462
709
                }
463
710
 
464
711
                private void parseFN( String[] params, String value )
465
 
                                throws ParseException, SkipContactException
466
712
                {
467
713
                        // already got a better name?
468
714
                        if( _name_level >= NAMELEVEL_FN ) return;
473
719
                }
474
720
 
475
721
                private void parseORG( String[] params, String value )
476
 
                                throws ParseException, SkipContactException
477
722
                {
478
 
                        // already got a better name?
479
 
                        if( _name_level >= NAMELEVEL_ORG ) return;
480
 
 
481
723
                        // get org parts
482
 
                        String[] orgparts = value.split( ";" );
483
 
                        for( int i = 0; i < orgparts.length; i++ )
484
 
                                orgparts[ i ] = orgparts[ i ].trim();
485
 
 
486
 
                        // build name
487
 
                        if( orgparts[ 0 ].length() == 0 && orgparts.length > 1 )
488
 
                                value = orgparts[ 1 ];
489
 
                        else
490
 
                                value = orgparts[ 0 ];
491
 
 
492
 
                        // set name
493
 
                        setName( value );
494
 
                        _name_level = NAMELEVEL_ORG;
 
724
                        String[] org_parts = splitValueBySemicolon( value );
 
725
                        if( org_parts == null || org_parts.length < 1 ) return;
 
726
 
 
727
                        // build organisation name
 
728
                        StringBuilder builder = new StringBuilder(
 
729
                                String.valueOf( org_parts[ 0 ] ) );
 
730
                        for( int a = 1; a < org_parts.length; a++ )
 
731
                                builder.append( ", " ).append( org_parts[ a ] );
 
732
                        String organisation = builder.toString();
 
733
 
 
734
                        // set organisation name (using a title we've previously found)
 
735
                        addOrganisation( organisation, _cached_title, true );
 
736
 
 
737
                        // if we've not previously found a title, store this organisation
 
738
                        // name (we'll need it when we find a title to update the
 
739
                        // organisation, by name), else if we *have* previously found a
 
740
                        // title, clear it (since we just used it)
 
741
                        if( _cached_title == null )
 
742
                                _cached_organisation = organisation;
 
743
                        else
 
744
                                _cached_title = null;
 
745
                }
 
746
 
 
747
                private void parseTITLE( String[] params, String value )
 
748
                {
 
749
                        // if we previously had an organisation, look it up and append this
 
750
                        // title to it
 
751
                        if( _cached_organisation != null && hasOrganisations() ) {
 
752
                                HashMap< String, ExtraDetail > datas = getOrganisations();
 
753
                                ExtraDetail detail = datas.get( _cached_organisation );
 
754
                                if( detail != null )
 
755
                                        detail.setExtra( value );
 
756
                        }
 
757
 
 
758
                        // same as when handling organisation, if we've not previously found
 
759
                        // an organisation we store this title, else we clear it (since we
 
760
                        // just appended this title to it)
 
761
                        if( _cached_organisation == null )
 
762
                                _cached_title = value;
 
763
                        else
 
764
                                _cached_organisation = null;
495
765
                }
496
766
 
497
767
                private void parseTEL( String[] params, String value )
498
 
                                throws ParseException
499
768
                {
500
769
                        if( value.length() == 0 ) return;
501
770
 
502
771
                        Set< String > types = extractTypes( params, Arrays.asList(
503
 
                                        "PREF", "HOME", "WORK", "VOICE", "FAX", "MSG", "CELL",
504
 
                                        "PAGER", "BBS", "MODEM", "CAR", "ISDN", "VIDEO" ) );
 
772
                                "PREF", "HOME", "WORK", "VOICE", "FAX", "MSG", "CELL",
 
773
                                "PAGER", "BBS", "MODEM", "CAR", "ISDN", "VIDEO" ) );
505
774
 
506
775
                        // here's the logic...
507
776
                        boolean preferred = types.contains( "PREF" );
508
 
                        if( types.contains( "VOICE" ) )
509
 
                                if( types.contains( "WORK" ) )
510
 
                                        addPhone( value, PhonesColumns.TYPE_WORK, preferred );
511
 
                                else
512
 
                                        addPhone( value, PhonesColumns.TYPE_HOME, preferred );
513
 
                        else if( types.contains( "CELL" ) || types.contains( "VIDEO" ) )
514
 
                                addPhone( value, PhonesColumns.TYPE_MOBILE, preferred );
 
777
                        int type;
515
778
                        if( types.contains( "FAX" ) )
516
779
                                if( types.contains( "HOME" ) )
517
 
                                        addPhone( value, PhonesColumns.TYPE_FAX_HOME, preferred );
 
780
                                        type = PhonesColumns.TYPE_FAX_HOME;
518
781
                                else
519
 
                                        addPhone( value, PhonesColumns.TYPE_FAX_WORK, preferred );
520
 
                        if( types.contains( "PAGER" ) )
521
 
                                addPhone( value, PhonesColumns.TYPE_PAGER, preferred );
 
782
                                        type = PhonesColumns.TYPE_FAX_WORK;
 
783
                        else if( types.contains( "CELL" ) || types.contains( "VIDEO" ) )
 
784
                                type = PhonesColumns.TYPE_MOBILE;
 
785
                        else if( types.contains( "PAGER" ) )
 
786
                                type = PhonesColumns.TYPE_PAGER;
 
787
                        else if( types.contains( "WORK" ) )
 
788
                                type = PhonesColumns.TYPE_WORK;
 
789
                        else
 
790
                                type = PhonesColumns.TYPE_HOME;
 
791
 
 
792
                        // add phone number
 
793
                        addNumber( value, type, preferred );
522
794
                }
523
795
 
524
796
                public void parseEMAIL( String[] params, String value )
525
 
                                throws ParseException
526
797
                {
527
798
                        if( value.length() == 0 ) return;
528
799
 
529
800
                        Set< String > types = extractTypes( params, Arrays.asList(
530
 
                                        "PREF", "WORK", "HOME", "INTERNET" ) );
 
801
                                "PREF", "WORK", "HOME", "INTERNET" ) );
531
802
 
532
 
                        // here's the logic...
 
803
                        // add email address
533
804
                        boolean preferred = types.contains( "PREF" );
534
 
                        if( types.contains( "WORK" ) )
535
 
                                addEmail( value, Contacts.ContactMethods.TYPE_WORK, preferred );
536
 
                        else
537
 
                                addEmail( value, Contacts.ContactMethods.TYPE_HOME, preferred );
 
805
                        int type;
 
806
                        if( types.contains( "WORK" ) )
 
807
                                type = Contacts.ContactMethods.TYPE_WORK;
 
808
                        else
 
809
                                type = Contacts.ContactMethods.TYPE_HOME;
 
810
 
 
811
                        addEmail( value, type, preferred );
 
812
                }
 
813
 
 
814
                private void parseADR( String[] params, String value )
 
815
                {
 
816
                        // get address parts
 
817
                        String[] adr_parts = splitValueBySemicolon( value );
 
818
 
 
819
                        // build address
 
820
                        value = "";
 
821
                        for( int a = 0; a < adr_parts.length; a++ ) {
 
822
                                if( value.length() > 0 ) value += "\n";
 
823
                                value += adr_parts[ a ].trim();
 
824
                        }
 
825
 
 
826
                        Set< String > types = extractTypes( params, Arrays.asList(
 
827
                                "PREF", "WORK", "HOME", "INTERNET" ) );
 
828
 
 
829
                        // add address
 
830
                        int type;
 
831
                        if( types.contains( "WORK" ) )
 
832
                                type = Contacts.ContactMethods.TYPE_WORK;
 
833
                        else
 
834
                                type = Contacts.ContactMethods.TYPE_HOME;
 
835
 
 
836
                        addAddress( value, type );
538
837
                }
539
838
 
540
839
                public void finaliseParsing()
541
 
                                throws ParseException, SkipContactException,
542
 
                                AbortImportException
 
840
                        throws ParseException, SkipContactException,
 
841
                        AbortImportException
543
842
                {
544
843
                        // missing version (and data is present)
545
 
                        if( _version == null && _lines != null )
 
844
                        if( _version == null && _buffers != null )
546
845
                                throw new ParseException( R.string.error_vcf_malformed );
547
846
 
548
 
                        //  missing name properties?
549
 
                        if( _name_level == NAMELEVEL_NONE )
550
 
                                throw new ParseException( R.string.error_vcf_noname );
551
 
 
552
 
                        // check if we should import this one? If we've already got an 'N'-
553
 
                        // type name, this will already have been done by parseN() so we
554
 
                        // mustn't do this here (or it could prompt twice!)
555
 
                        if( _name_level < NAMELEVEL_N && !isImportRequired( getName() ) )
556
 
                                throw new SkipContactException();
 
847
                        // check if we should import this contact
 
848
                        try {
 
849
                                if( !isImportRequired( this ) )
 
850
                                        throw new SkipContactException();
 
851
                        }
 
852
                        catch( ContactNeedsMoreInfoException e ) {
 
853
                                throw new ParseException( R.string.error_vcf_notenoughinfo );
 
854
                        }
557
855
                }
558
856
 
559
857
                private String checkParam( String[] params, String name )
560
858
                {
561
 
                        Pattern p = Pattern.compile( "^" + name + "[ \\t]*=[ \\t]*(.*)$" );
 
859
                        Pattern p = Pattern.compile(
 
860
                                "^" + name + "[ \\t]*=[ \\t]*(\"?)(.*)\\1$" );
562
861
                        for( int i = 0; i < params.length; i++ ) {
563
862
                                Matcher m = p.matcher( params[ i ] );
564
863
                                if( m.matches() )
565
 
                                        return m.group( 1 );
 
864
                                        return m.group( 2 );
566
865
                        }
567
866
                        return null;
568
867
                }
569
868
 
570
869
                private Set< String > extractTypes( String[] params,
571
 
                                List< String > validTypes )
 
870
                        List< String > valid_types )
572
871
                {
573
872
                        HashSet< String > types = new HashSet< String >();
574
873
 
575
874
                        // get 3.0-style TYPE= param
576
 
                        String typeParam;
577
 
                        if( ( typeParam = checkParam( params, "TYPE" ) ) != null ) {
578
 
                                String[] bits = typeParam.split( "," );
579
 
                                for( int i = 0; i < bits.length; i++ )
580
 
                                        if( validTypes.contains( bits[ i ] ) )
581
 
                                                types.add( bits[ i ] );
 
875
                        String type_param;
 
876
                        if( ( type_param = checkParam( params, "TYPE" ) ) != null ) {
 
877
                                String[] parts = type_param.split( "," );
 
878
                                for( int i = 0; i < parts.length; i++ )
 
879
                                        if( valid_types.contains( parts[ i ] ) )
 
880
                                                types.add( parts[ i ] );
582
881
                        }
583
882
 
584
883
                        // get 2.1-style type param
585
884
                        if( _version.equals( "2.1" ) ) {
586
885
                                for( int i = 1; i < params.length; i++ )
587
 
                                        if( validTypes.contains( params[ i ] ) )
 
886
                                        if( valid_types.contains( params[ i ] ) )
588
887
                                                types.add( params[ i ] );
589
888
                        }
590
889
 
591
890
                        return types;
592
891
                }
593
892
 
594
 
                private UnencodeResult unencodeQuotedPrintable( String str, String charset )
 
893
                private UnencodeResult unencodeQuotedPrintable( ByteBuffer in )
595
894
                {
596
895
                        boolean another = false;
597
896
 
598
 
                        // default encoding scheme
599
 
                        if( charset == null ) charset = "UTF-8";
600
 
 
601
 
                        // unencode quoted-pritable encoding, as per RFC1521 section 5.1
602
 
                        byte[] bytes = new byte[ str.length() ];
 
897
                        // unencode quoted-printable encoding, as per RFC1521 section 5.1
 
898
                        byte[] out = new byte[ in.limit() - in.position() ];
603
899
                        int j = 0;
604
 
                        for( int i = 0; i < str.length(); i++ )
 
900
                        for( int i = in.position(); i < in.limit(); i++ )
605
901
                        {
606
902
                                // get next char and process...
607
 
                                char ch = str.charAt( i );
608
 
                                if( ch == '=' && i < str.length() - 2 )
 
903
                                byte ch = in.array()[ i ];
 
904
                                if( ch == '=' && i < in.limit() - 2 )
609
905
                                {
610
906
                                        // we found a =XX format byte, add it
611
 
                                        bytes[ j ] = (byte)(
612
 
                                                        Character.digit( str.charAt( i + 1 ), 16 ) * 16 +
613
 
                                                        Character.digit( str.charAt( i + 2 ), 16 ) );
 
907
                                        out[ j ] = (byte)(
 
908
                                                        Character.digit( in.array()[ i + 1 ], 16 ) * 16 +
 
909
                                                        Character.digit( in.array()[ i + 2 ], 16 ) );
614
910
                                        i += 2;
615
911
                                }
616
 
                                else if( ch == '=' && i == str.length() - 1 )
 
912
                                else if( ch == '=' && i == in.limit() - 1 )
617
913
                                {
618
914
                                        // we found a '=' at the end of a line signifying a multi-
619
915
                                        // line string, so we don't add it.
622
918
                                }
623
919
                                else
624
920
                                        // just a normal char...
625
 
                                        bytes[ j ] = (byte)ch;
 
921
                                        out[ j ] = (byte)ch;
626
922
                                j++;
627
923
                        }
628
924
 
629
 
                        return new UnencodeResult( another, bytes, j );
 
925
                        return new UnencodeResult( another, ByteBuffer.wrap( out, 0, j ) );
 
926
                }
 
927
 
 
928
                private ByteBuffer transcodeAsciiToUtf8( ByteBuffer in )
 
929
                {
 
930
                        // transcode
 
931
                        byte[] out = new byte[ ( in.limit() - in.position() ) * 2 ];
 
932
                        int j = 0;
 
933
                        for( int a = in.position(); a < in.limit(); a++ )
 
934
                        {
 
935
                                // if char is < 127, keep it as-is
 
936
                                if( in.array()[ a ] >= 0 )
 
937
                                        out[ j++ ] = in.array()[ a ];
 
938
 
 
939
                                // else, convert it to UTF-8
 
940
                                else {
 
941
                                        int b = 0xff & (int)in.array()[ a ];
 
942
                                        out[ j++ ] = (byte)( 0xc0 | ( b >> 6 ) );
 
943
                                        out[ j++ ] = (byte)( 0x80 | ( b & 0x3f ) );
 
944
                                }
 
945
                        }
 
946
 
 
947
                        return ByteBuffer.wrap( out, 0, j );
630
948
                }
631
949
        }
632
950
}