Subversion Repository Public Repository

litesoft

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
// This Source Code is in the Public Domain per: http://unlicense.org
package org.litesoft.core.util.text;

import org.litesoft.commonfoundation.charstreams.*;
import org.litesoft.commonfoundation.typeutils.*;

import java.util.*;

public class CodedTextParser {
    public static List<String> parse( String pText ) {
        ArrayList<String> rv = new ArrayList<String>();
        if ( pText != null ) {
            CharSource zSource = new CharSourceFromSequence( pText );
            if ( consumeNonVisible7bitAscii( zSource ) ) {
                do {
                    if ( !rv.isEmpty() ) {
                        rv.add( " " );
                    }
                    addChunk( rv, getUpToNonVisible7bitAscii( zSource ) );
                }
                while ( consumeNonVisible7bitAscii( zSource ) );
            }
        }
        return rv;
    }

    private static String getUpToNonVisible7bitAscii( CharSource pSource ) {
        if ( !pSource.anyRemaining() ) {
            return "";
        }
        StringBuilder sb = new StringBuilder();
        for ( int c = pSource.peek(); (c != -1) && ((' ' < c) && (c <= 126)); c = pSource.peek() ) {
            sb.append( pSource.getRequired() );
        }
        return sb.toString();
    }

    private static boolean consumeNonVisible7bitAscii( CharSource pSource ) {
        for ( int c = pSource.peek(); (c != -1) && ((c <= ' ') || (126 < c)); c = pSource.peek() ) {
            pSource.get(); // Consume
        }
        return pSource.anyRemaining();
    }

    private static void addChunk( List<String> pCollector, String pToken ) {
        if ( pToken.length() > 1 ) {
            int zLeadingPunc = 0;
            while ( zLeadingPunc < pToken.length() && !Characters.isAlphaNumeric( pToken.charAt( zLeadingPunc ) ) ) {
                zLeadingPunc++;
            }
            if ( zLeadingPunc != pToken.length() ) {
                if ( zLeadingPunc != 0 ) {
                    pCollector.add( pToken.substring( 0, zLeadingPunc ) );
                    pToken = pToken.substring( zLeadingPunc );
                }

                int zTrailingPunc = 0;
                while ( !Characters.isAlphaNumeric( pToken.charAt( pToken.length() - (zTrailingPunc + 1) ) ) ) {
                    zTrailingPunc++;
                }
                if ( zTrailingPunc != 0 ) {
                    int zAt = pToken.length() - zTrailingPunc;
                    pCollector.add( pToken.substring( 0, zAt ) );
                    pToken = pToken.substring( zAt );
                }
            }
        }
        pCollector.add( pToken );
    }
}

Commits for litesoft/trunk/Java/core/Anywhere/src/org/litesoft/core/util/text/CodedTextParser.java

Diff revisions: vs.
Revision Author Commited Message
948 Diff Diff GeorgeS picture GeorgeS Sat 07 Jun, 2014 23:42:39 +0000

Jusefuls Formatter Updated to New Code Format

947 Diff Diff GeorgeS picture GeorgeS Fri 06 Jun, 2014 23:36:56 +0000

Correct Spelling of package!

942 Diff Diff GeorgeS picture GeorgeS Mon 02 Jun, 2014 23:41:46 +0000

Extracting commonfoundation

939 Diff Diff GeorgeS picture GeorgeS Mon 02 Jun, 2014 21:30:31 +0000

Extracting commonfoundation

811 Diff Diff GeorgeS picture GeorgeS Sat 18 Aug, 2012 13:45:18 +0000
772 Diff Diff GeorgeS picture GeorgeS Sun 15 Jul, 2012 16:55:51 +0000

!

49 Diff Diff GeorgeS picture GeorgeS Mon 12 Apr, 2010 02:59:10 +0000

License Text

2 GeorgeS picture GeorgeS Sun 07 Feb, 2010 12:50:58 +0000