Changeset 6000


Ignore:
Timestamp:
02/20/15 14:49:29 (9 years ago)
Author:
teckart@informatik.uni-leipzig.de
Message:

More tolerant postprocessing: each run of consecutive whitespace characters is collapsed into a single space before the value is split

File:
1 edited

Legend:

Unmodified
Added
Removed
  • vlo/trunk/vlo-importer/src/main/java/eu/clarin/cmdi/vlo/importer/OrganisationPostProcessor.java

    r5887 r6000  
    1515import javax.xml.xpath.XPathExpressionException;
    1616import javax.xml.xpath.XPathFactory;
     17import org.slf4j.Logger;
     18import org.slf4j.LoggerFactory;
    1719import org.w3c.dom.Document;
    1820import org.w3c.dom.Node;
     
    2325
    2426    private static Map<String, String> organisationNamesMap = null;
     27    private final static Logger LOG = LoggerFactory.getLogger(OrganisationPostProcessor.class);
    2528
    2629    /**
     
    3538    @Override
    3639    public List<String> process(String value) {
    37         String[] splitArray = value.split(";");
     40        String[] splitArray = normalizeString(value).split(";");
    3841        for (int i = 0; i < splitArray.length; i++) {
    3942            String orgaName = splitArray[i];
     
    4245            }
    4346        }
    44 
     47       
    4548        return Arrays.asList(splitArray);
     49    }
     50   
     51    private String normalizeString(String value) {
     52        return value.replaceAll("\\s+", " ");
    4653    }
    4754
Note: See TracChangeset for help on using the changeset viewer.