154
148
private void importVCardFile( File file ) throws AbortImportException
156
// check file is good
158
showError( getText( R.string.error_filenotfound ) +
160
if( file.length() == 0 )
161
showError( getText( R.string.error_fileisempty ) +
167
FileInputStream istream = new FileInputStream( file );
168
byte[] content = new byte[ (int)file.length() ];
169
istream.read( content );
172
importVCardFileContent( content, file.getName() );
153
BufferedReader reader = new BufferedReader(
154
new FileReader( file ) );
157
StringBuffer content = new StringBuffer();
159
while( ( line = reader.readLine() ) != null )
160
content.append( line ).append( "\n" );
162
importVCardFileContent( content.toString(), file.getName() );
174
164
catch( FileNotFoundException e ) {
175
showError( getText( R.string.error_filenotfound ) +
165
showError( getText( R.string.error_filenotfound ) + file.getName() );
178
167
catch( IOException e ) {
179
168
showError( getText( R.string.error_ioerror ) + file.getName() );
183
private void importVCardFileContent( byte[] content, String fileName )
184
throws AbortImportException
172
private void importVCardFileContent( String content, String fileName )
173
throws AbortImportException
175
// unfold RFC2425 section 5.8.1 folded lines, except that we must also
176
// handle embedded Quoted-Printable encodings that have a trailing '='.
177
// So we remove these first before doing RFC2425 unfolding.
178
content = content.replaceAll( "=\n[ \\t]", "" )
179
.replaceAll( "\n[ \\t]", "" );
181
// get lines and parse them
182
String[] lines = content.split( "\n" );
187
183
VCard vCard = null;
188
ContentLineIterator cli = new ContentLineIterator( content );
189
while( cli.hasNext() )
184
for( int i = 0; i < lines.length; i++ )
191
ByteBuffer buffer = cli.next();
193
// get a US-ASCII version of the line for processing
196
line = new String( buffer.array(), buffer.position(),
197
buffer.limit() - buffer.position(), "US-ASCII" );
199
catch( UnsupportedEncodingException e ) {
200
// we know US-ASCII is supported, so appease the compiler...
186
String line = lines[ i ];
204
188
if( vCard == null ) {
205
189
// look for vcard beginning
206
if( line.matches( "^BEGIN:VCARD" ) ) {
190
if( line.matches( "^BEGIN[ \\t]*:[ \\t]*VCARD" ) ) {
207
191
setProgress( ++_progress );
208
192
vCard = new VCard();
212
196
// look for vcard content or ending
213
if( line.matches( "^END:VCARD" ) )
197
if( line.matches( "^END[ \\t]*:[ \\t]*VCARD" ) )
215
199
// store vcard and do away with it
387
272
@SuppressWarnings("serial")
388
273
protected class SkipContactException extends Exception { }
390
private String extractCollonPartFromLine( ByteBuffer buffer,
391
String line, boolean former )
395
// get a US-ASCII version of the line for processing, unless we were
399
line = new String( buffer.array(), buffer.position(),
400
buffer.limit() - buffer.position(), "US-ASCII" );
402
catch( UnsupportedEncodingException e ) {
403
// we know US-ASCII is supported, so appease the compiler...
408
// split line into name and value parts and check to make sure we
409
// only got 2 parts and that the first part is not zero in length
410
String[] parts = line.split( ":", 2 );
411
if( parts.length == 2 && parts[ 0 ].length() > 0 )
412
ret = parts[ former? 0 : 1 ];
417
private String extractNameAndParamsFromLine( ByteBuffer buffer,
420
return extractCollonPartFromLine( buffer, line, true );
423
private String extractValueFromLine( ByteBuffer buffer, String line )
425
return extractCollonPartFromLine( buffer, line, false );
428
public void parseLine( ByteBuffer buffer, String line,
429
boolean next_line_looks_folded )
430
throws ParseException, SkipContactException,
433
// do we have a version yet?
275
public void parseLine( String line )
276
throws ParseException, SkipContactException,
279
// get property halves
280
String[] props = line.split( ":" );
281
for( int i = 0; i < props.length; i++ )
282
props[ i ] = props[ i ].trim();
283
if( props.length < 2 ||
284
props[ 0 ].length() < 1 || props[ 1 ].length() < 1 )
285
throw new ParseException( R.string.error_vcf_malformed );
434
287
if( _version == null )
436
// tentatively get name and params from line
437
String name_and_params =
438
extractNameAndParamsFromLine( buffer, line );
440
// is it a version line?
441
if( name_and_params != null &&
442
name_and_params.equals( "VERSION" ) )
289
if( props[ 0 ].equals( "VERSION" ) )
445
String value = extractValueFromLine( buffer, line );
446
if( !value.equals( "2.1" ) && !value.equals( "3.0" ) )
292
if( !props[ 1 ].equals( "2.1" ) &&
293
!props[ 1 ].equals( "3.0" ) )
447
294
throw new ParseException( R.string.error_vcf_version );
295
_version = props[ 1 ];
450
// parse any buffers we've been accumulating while we waited
452
if( _buffers != null )
453
for( int i = 0; i < _buffers.size(); i++ )
454
parseLine( _buffers.get( i ), null,
455
i + 1 < _buffers.size() &&
456
_buffers.get( i + 1 ).hasRemaining() &&
457
_buffers.get( i + 1 ).get(
458
_buffers.get( i + 1 ).position() ) == ' ' );
297
// parse any other lines we've accumulated so far
299
for( int i = 0; i < _lines.size(); i++ )
300
parseLine( _lines.get( i ) );
463
// no, so stash this line till we get a version
464
if( _buffers == null )
465
_buffers = new Vector< ByteBuffer >();
466
_buffers.add( buffer );
305
// stash this line till we have a version
307
_lines = new Vector< String >();
471
// name and params and the position in the buffer where the
472
// "value" part of the line starts
473
String name_and_params;
476
if( _parser_multiline_state != MULTILINE_NONE )
478
// if we're currently in a multi-line value, use the stored
479
// property name and parameters
480
name_and_params = _parser_current_name_and_params;
482
// skip some initial line characters, depending on the type
483
// of multi-line we're handling
484
pos = buffer.position();
485
switch( _parser_multiline_state )
487
case MULTILINE_FOLDED:
490
case MULTILINE_ENCODED:
491
while( pos < buffer.limit() && (
492
buffer.get( pos ) == ' ' ||
493
buffer.get( pos ) == '\t' ) )
502
// take us out of multi-line so that we can re-detect that
503
// this line is a multi-line or not
504
_parser_multiline_state = MULTILINE_NONE;
508
// get name and params from line, and since we're not
509
// parsing a subsequent line in a multi-line, this should
510
// not fail, or it's an error
512
extractNameAndParamsFromLine( buffer, line );
513
if( name_and_params == null )
514
throw new ParseException(
515
R.string.error_vcf_malformed );
517
// calculate how many chars to skip from beginning of line
518
// so we skip the property "name:" part
519
pos = buffer.position() + name_and_params.length() + 1;
521
// reset the saved multi-line state
522
_parser_current_name_and_params = name_and_params;
523
_parser_buffered_value_so_far = "";
526
// get value from buffer, as raw bytes
528
value = ByteBuffer.wrap( buffer.array(), pos,
529
buffer.limit() - pos );
531
313
// get parameter parts
532
String[] name_param_parts = name_and_params.split( ";", -1 );
533
for( int i = 0; i < name_param_parts.length; i++ )
534
name_param_parts[ i ] = name_param_parts[ i ].trim();
536
// parse encoding parameter
537
String encoding = checkParam( name_param_parts, "ENCODING" );
538
if( encoding != null ) encoding = encoding.toUpperCase();
539
if( encoding != null && !encoding.equals( "8BIT" ) &&
540
!encoding.equals( "QUOTED-PRINTABLE" ) )
541
//&& !encoding.equals( "BASE64" ) )
543
throw new ParseException( R.string.error_vcf_encoding );
546
// parse charset parameter
547
String charset = checkParam( name_param_parts, "CHARSET" );
548
if( charset != null ) charset = charset.toUpperCase();
549
if( charset != null && !charset.equals( "US-ASCII" ) &&
550
!charset.equals( "ASCII" ) &&
551
!charset.equals( "UTF-8" ) )
553
throw new ParseException( R.string.error_vcf_charset );
556
// do unencoding (or default to a fake unencoding result with
558
UnencodeResult unencoding_result = null;
559
if( encoding != null && encoding.equals( "QUOTED-PRINTABLE" ) )
560
unencoding_result = unencodeQuotedPrintable( value );
561
// else if( encoding != null && encoding.equals( "BASE64" ) )
562
// unencoding_result = unencodeBase64( props[ 1 ], charset );
563
if( unencoding_result != null ) {
564
value = unencoding_result.getBuffer();
565
if( unencoding_result.isAnotherLineRequired() )
566
_parser_multiline_state = MULTILINE_ENCODED;
569
// convert 8-bit ASCII charset to UTF-8
570
if( charset == null || charset.equals( "ASCII" ) ) {
571
value = transcodeAsciiToUtf8( value );
578
string_value = new String( value.array(), value.position(),
579
value.limit() - value.position(), charset );
580
} catch( UnsupportedEncodingException e ) {
581
throw new ParseException( R.string.error_vcf_charset );
584
// for some entries that have semicolon-separated value parts,
585
// check to see if the value ends in an escape character, which
586
// indicates that we have a multi-line value
587
if( ( name_param_parts[ 0 ].equals( "N" ) ||
588
name_param_parts[ 0 ].equals( "ORG" ) ||
589
name_param_parts[ 0 ].equals( "ADR" ) ) &&
590
doesStringEndInAnEscapeChar( string_value ) )
592
_parser_multiline_state = MULTILINE_ESCAPED;
593
string_value = string_value.substring( 0,
594
string_value.length() - 1 );
597
// now we know whether we're in an encoding multi-line,
598
// determine if we're in a v3 folded multi-line or not
599
if( _parser_multiline_state == MULTILINE_NONE &&
600
_version.equals( "3.0" ) && next_line_looks_folded )
602
_parser_multiline_state = MULTILINE_FOLDED;
605
// handle multi-lines by buffering them and parsing them when we
606
// are processing the last line in a multi-line sequence
607
if( _parser_multiline_state != MULTILINE_NONE ) {
608
_parser_buffered_value_so_far += string_value;
611
String complete_value =
612
( _parser_buffered_value_so_far + string_value ).trim();
614
// ignore empty values
615
if( complete_value.length() < 1 ) return;
314
String[] params = props[ 0 ].split( ";" );
315
for( int i = 0; i < params.length; i++ )
316
params[ i ] = params[ i ].trim();
617
318
// parse some properties
618
if( name_param_parts[ 0 ].equals( "N" ) )
619
parseN( name_param_parts, complete_value );
620
else if( name_param_parts[ 0 ].equals( "FN" ) )
621
parseFN( name_param_parts, complete_value );
622
else if( name_param_parts[ 0 ].equals( "ORG" ) )
623
parseORG( name_param_parts, complete_value );
624
else if( name_param_parts[ 0 ].equals( "TEL" ) )
625
parseTEL( name_param_parts, complete_value );
626
else if( name_param_parts[ 0 ].equals( "EMAIL" ) )
627
parseEMAIL( name_param_parts, complete_value );
628
else if( name_param_parts[ 0 ].equals( "ADR" ) )
629
parseADR( name_param_parts, complete_value );
633
private boolean doesStringEndInAnEscapeChar( String string )
635
// count the number of backslashes at the end of the string
637
for( int a = string.length() - 1; a >= 0; a-- )
638
if( string.charAt( a ) == '\\' )
643
// if there are an even number of backslashes then the final one
645
return ( count & 1 ) == 1;
648
private String[] splitValueBySemicolon( String value )
650
// split string into parts by semicolon
651
ArrayList< String > parts = new ArrayList< String >(
652
Arrays.asList( value.split( ";" ) ) );
655
for( int a = 0; a < parts.size(); a++ )
657
String str = parts.get( a );
659
// look for parts that end in an escape character, but ignore
660
// the final part. We've already detected escape chars at the
661
// end of the final part in parseLine() and handled multi-lines
663
if( a < parts.size() - 1 &&
664
doesStringEndInAnEscapeChar( str ) )
666
// join the next part to this part and remove the next part
667
parts.set( a, str.substring( 0, str.length() - 1 ) +
668
';' + parts.get( a + 1 ) );
669
parts.remove( a + 1 );
671
// re-visit this part
676
// trim and replace string
681
String[] ret = new String[ parts.size() ];
682
return parts.toArray( ret );
319
if( params[ 0 ].equals( "N" ) )
320
parseN( params, props[ 1 ] );
321
else if( params[ 0 ].equals( "FN" ) )
322
parseFN( params, props[ 1 ] );
323
else if( params[ 0 ].equals( "ORG" ) )
324
parseORG( params, props[ 1 ] );
325
else if( params[ 0 ].equals( "TEL" ) )
326
parseTEL( params, props[ 1 ] );
327
else if( params[ 0 ].equals( "EMAIL" ) )
328
parseEMAIL( params, props[ 1 ] );
685
332
private void parseN( String[] params, String value )
686
throws ParseException, SkipContactException,
333
throws ParseException, SkipContactException,
689
336
// already got a better name?
690
if( _name_level >= NAMELEVEL_N ) return;
337
if( _nameLevel >= NAMELEVEL_N ) return;
692
339
// get name parts
693
String[] name_parts = splitValueBySemicolon( value );
340
String[] nameparts = value.split( ";" );
341
for( int i = 0; i < nameparts.length; i++ )
342
nameparts[ i ] = nameparts[ i ].trim();
697
if( name_parts.length > 1 && name_parts[ 1 ].length() > 0 )
698
value += name_parts[ 1 ];
699
if( name_parts.length > 0 && name_parts[ 0 ].length() > 0 )
700
value += ( value.length() == 0? "" : " " ) + name_parts[ 0 ];
346
if( nameparts.length > 1 && nameparts[ 1 ].length() > 0 )
347
value += nameparts[ 1 ];
348
if( nameparts[ 0 ].length() > 0 )
349
value += ( value.length() == 0? "" : " " ) + nameparts[ 0 ];
704
_name_level = NAMELEVEL_N;
352
setName( undoCharsetAndEncoding( params, value ) );
353
_nameLevel = NAMELEVEL_N;
706
355
// check now to see if we need to import this contact (to avoid
707
356
// parsing the rest of the vCard unnecessarily)
712
361
private void parseFN( String[] params, String value )
713
throws ParseException, SkipContactException
362
throws ParseException, SkipContactException
715
364
// already got a better name?
716
if( _name_level >= NAMELEVEL_FN ) return;
365
if( _nameLevel >= NAMELEVEL_FN ) return;
720
_name_level = NAMELEVEL_FN;
368
setName( undoCharsetAndEncoding( params, value ) );
369
_nameLevel = NAMELEVEL_FN;
723
372
private void parseORG( String[] params, String value )
724
throws ParseException, SkipContactException
373
throws ParseException, SkipContactException
726
375
// already got a better name?
727
if( _name_level >= NAMELEVEL_ORG ) return;
376
if( _nameLevel >= NAMELEVEL_ORG ) return;
730
String[] org_parts = splitValueBySemicolon( value );
379
String[] orgparts = value.split( ";" );
380
for( int i = 0; i < orgparts.length; i++ )
381
orgparts[ i ] = orgparts[ i ].trim();
733
if( org_parts.length > 1 && org_parts[ 0 ].length() == 0 )
734
value = org_parts[ 1 ];
735
else if( org_parts.length > 1 && org_parts[ 1 ].length() > 0 )
736
value = org_parts[ 0 ] + ", " + org_parts[ 1 ];
384
if( orgparts[ 0 ].length() == 0 && orgparts.length > 1 )
385
value = orgparts[ 1 ];
738
value = org_parts[ 0 ];
387
value = orgparts[ 0 ];
742
_name_level = NAMELEVEL_ORG;
390
setName( undoCharsetAndEncoding( params, value ) );
391
_nameLevel = NAMELEVEL_ORG;
745
394
private void parseTEL( String[] params, String value )
746
throws ParseException
395
throws ParseException
748
397
if( value.length() == 0 ) return;
750
399
Set< String > types = extractTypes( params, Arrays.asList(
751
"PREF", "HOME", "WORK", "VOICE", "FAX", "MSG", "CELL",
752
"PAGER", "BBS", "MODEM", "CAR", "ISDN", "VIDEO" ) );
400
"PREF", "HOME", "WORK", "VOICE", "FAX", "MSG", "CELL",
401
"PAGER", "BBS", "MODEM", "CAR", "ISDN", "VIDEO" ) );
754
403
// here's the logic...
755
404
boolean preferred = types.contains( "PREF" );
756
int type = PhonesColumns.TYPE_MOBILE;
757
405
if( types.contains( "VOICE" ) )
758
406
if( types.contains( "WORK" ) )
759
type = PhonesColumns.TYPE_WORK;
407
addPhone( value, PhonesColumns.TYPE_WORK, preferred );
761
type = PhonesColumns.TYPE_HOME;
409
addPhone( value, PhonesColumns.TYPE_HOME, preferred );
762
410
else if( types.contains( "CELL" ) || types.contains( "VIDEO" ) )
763
type = PhonesColumns.TYPE_MOBILE;
411
addPhone( value, PhonesColumns.TYPE_MOBILE, preferred );
764
412
if( types.contains( "FAX" ) )
765
413
if( types.contains( "HOME" ) )
766
type = PhonesColumns.TYPE_FAX_HOME;
414
addPhone( value, PhonesColumns.TYPE_FAX_HOME, preferred );
768
type = PhonesColumns.TYPE_FAX_WORK;
416
addPhone( value, PhonesColumns.TYPE_FAX_WORK, preferred );
769
417
if( types.contains( "PAGER" ) )
770
type = PhonesColumns.TYPE_PAGER;
773
addPhone( value, type, preferred );
418
addPhone( value, PhonesColumns.TYPE_PAGER, preferred );
776
421
public void parseEMAIL( String[] params, String value )
777
throws ParseException
779
423
if( value.length() == 0 ) return;
781
425
Set< String > types = extractTypes( params, Arrays.asList(
782
"PREF", "WORK", "HOME", "INTERNET" ) );
426
"PREF", "WORK", "HOME", "INTERNET" ) );
428
// here's the logic...
785
429
boolean preferred = types.contains( "PREF" );
786
430
if( types.contains( "WORK" ) )
787
431
addEmail( value, Contacts.ContactMethods.TYPE_WORK, preferred );
789
433
addEmail( value, Contacts.ContactMethods.TYPE_HOME, preferred );
792
private void parseADR( String[] params, String value )
793
throws ParseException, SkipContactException
796
String[] adr_parts = splitValueBySemicolon( value );
800
for( int a = 0; a < adr_parts.length; a++ ) {
801
if( value.length() > 0 ) value += "\n";
802
value += adr_parts[ a ].trim();
805
Set< String > types = extractTypes( params, Arrays.asList(
806
"PREF", "WORK", "HOME", "INTERNET" ) );
809
if( types.contains( "WORK" ) )
810
addAddress( value, Contacts.ContactMethods.TYPE_WORK );
812
addAddress( value, Contacts.ContactMethods.TYPE_HOME);
815
436
public void finaliseParsing()
816
throws ParseException, SkipContactException,
437
throws ParseException, SkipContactException,
819
440
// missing version (and data is present)
820
if( _version == null && _buffers != null )
441
if( _version == null && _lines != null )
821
442
throw new ParseException( R.string.error_vcf_malformed );
823
444
// missing name properties?
824
if( _name_level == NAMELEVEL_NONE )
445
if( _nameLevel == NAMELEVEL_NONE )
825
446
throw new ParseException( R.string.error_vcf_noname );
827
448
// check if we should import this one? If we've already got an 'N'-
828
449
// type name, this will already have been done by parseN() so we
829
450
// mustn't do this here (or it could prompt twice!)
830
if( _name_level < NAMELEVEL_N && !isImportRequired( getName() ) )
451
if( _nameLevel < NAMELEVEL_N && !isImportRequired( getName() ) )
831
452
throw new SkipContactException();
455
private String undoCharsetAndEncoding( String[] params, String value )
456
throws ParseException
458
// check encoding/charset
459
String charset, encoding;
460
if( ( charset = checkParam( params, "CHARSET" ) ) != null &&
461
!charset.equals( "UTF-8" ) && !charset.equals( "UTF-16" ) )
462
throw new ParseException( R.string.error_vcf_charset );
463
if( ( encoding = checkParam( params, "ENCODING" ) ) != null &&
464
!encoding.equals( "QUOTED-PRINTABLE" ) )
465
throw new ParseException( R.string.error_vcf_encoding );
468
if( encoding != null && encoding.equals( "QUOTED-PRINTABLE" ) )
469
return unencodeQuotedPrintable( value, charset );
834
475
private String checkParam( String[] params, String name )
836
Pattern p = Pattern.compile(
837
"^" + name + "[ \\t]*=[ \\t]*(\"?)(.*)\\1$" );
477
Pattern p = Pattern.compile( "^" + name + "[ \\t]*=[ \\t]*(.*)$" );
838
478
for( int i = 0; i < params.length; i++ ) {
839
479
Matcher m = p.matcher( params[ i ] );
840
480
if( m.matches() )
846
486
private Set< String > extractTypes( String[] params,
847
List< String > valid_types )
487
List< String > validTypes )
849
489
HashSet< String > types = new HashSet< String >();
851
491
// get 3.0-style TYPE= param
853
if( ( type_param = checkParam( params, "TYPE" ) ) != null ) {
854
String[] parts = type_param.split( "," );
855
for( int i = 0; i < parts.length; i++ )
856
if( valid_types.contains( parts[ i ] ) )
857
types.add( parts[ i ] );
493
if( ( typeParam = checkParam( params, "TYPE" ) ) != null ) {
494
String[] bits = typeParam.split( "," );
495
for( int i = 0; i < bits.length; i++ )
496
if( validTypes.contains( bits[ i ] ) )
497
types.add( bits[ i ] );
860
500
// get 2.1-style type param
861
501
if( _version.equals( "2.1" ) ) {
862
502
for( int i = 1; i < params.length; i++ )
863
if( valid_types.contains( params[ i ] ) )
503
if( validTypes.contains( params[ i ] ) )
864
504
types.add( params[ i ] );
870
private UnencodeResult unencodeQuotedPrintable( ByteBuffer in )
510
private String unencodeQuotedPrintable( String str, String charset )
872
boolean another = false;
512
// default encoding scheme
513
if( charset == null ) charset = "UTF-8";
874
// unencode quoted-printable encoding, as per RFC1521 section 5.1
875
byte[] out = new byte[ in.limit() - in.position() ];
515
// unencode quoted-printable encoding, as per RFC1521 section 5.1
516
byte[] bytes = new byte[ str.length() ];
877
for( int i = in.position(); i < in.limit(); i++ )
879
// get next char and process...
880
byte ch = in.array()[ i ];
881
if( ch == '=' && i < in.limit() - 2 )
883
// we found a =XX format byte, add it
885
Character.digit( in.array()[ i + 1 ], 16 ) * 16 +
886
Character.digit( in.array()[ i + 2 ], 16 ) );
518
for( int i = 0; i < str.length(); i++, j++ ) {
519
char ch = str.charAt( i );
520
if( ch == '=' && i < str.length() - 2 ) {
522
Character.digit( str.charAt( i + 1 ), 16 ) * 16 +
523
Character.digit( str.charAt( i + 2 ), 16 ) );
889
else if( ch == '=' && i == in.limit() - 1 )
891
// we found a '=' at the end of a line signifying a multi-
892
// line string, so we don't add it.
897
// just a normal char...
902
return new UnencodeResult( another, ByteBuffer.wrap( out, 0, j ) );
905
private ByteBuffer transcodeAsciiToUtf8( ByteBuffer in )
908
byte[] out = new byte[ ( in.limit() - in.position() ) * 2 ];
910
for( int a = in.position(); a < in.limit(); a++ )
912
// if byte is <= 127 (i.e. 7-bit ASCII), keep it as-is
913
if( in.array()[ a ] >= 0 )
914
out[ j++ ] = in.array()[ a ];
916
// else, convert it to UTF-8
918
int b = 0xff & (int)in.array()[ a ];
919
out[ j++ ] = (byte)( 0xc0 | ( b >> 6 ) );
920
out[ j++ ] = (byte)( 0x80 | ( b & 0x3f ) );
924
return ByteBuffer.wrap( out, 0, j );
527
bytes[ j ] = (byte)ch;
530
return new String( bytes, 0, j, charset );
531
} catch( UnsupportedEncodingException e ) { }