public MaryData process(MaryData d) throws Exception { String plainText = MaryUtils.normaliseUnicodePunctuation(d.getPlainText()); MaryData result = new MaryData(outputType(), d.getLocale(), true); Document doc = result.getDocument(); Element root = doc.getDocumentElement(); Locale l = determineLocale(plainText, d.getLocale()); root.setAttribute("xml:lang", MaryUtils.locale2xmllang(l)); if (splitIntoParagraphs) { // Empty lines separate paragraphs String[] inputTexts = plainText.split("\\n(\\s*\\n)+"); for (int i = 0; i < inputTexts.length; i++) { String paragraph = inputTexts[i].trim(); if (paragraph.length() == 0) continue; appendParagraph(paragraph, root, d.getLocale()); } } else { // The whole text as one single paragraph appendParagraph(plainText, root, d.getLocale()); } result.setDocument(doc); return result; }
public MaryData process(MaryData d) throws Exception { String plainText = MaryUtils.normaliseUnicodePunctuation(d.getPlainText()); MaryData result = new MaryData(outputType(), d.getLocale(), true); Document doc = result.getDocument(); Element root = doc.getDocumentElement(); Locale l = determineLocale(plainText, d.getLocale()); root.setAttribute("xml:lang", MaryUtils.locale2xmllang(l)); if (splitIntoParagraphs) { // Empty lines separate paragraphs String[] inputTexts = plainText.split("\\n(\\s*\\n)+"); for (int i = 0; i < inputTexts.length; i++) { String paragraph = inputTexts[i].trim(); if (paragraph.length() == 0) continue; appendParagraph(paragraph, root, d.getLocale()); } } else { // The whole text as one single paragraph appendParagraph(plainText, root, d.getLocale()); } result.setDocument(doc); return result; }
public MaryData process(MaryData d) throws Exception { String plainText = MaryUtils.normaliseUnicodePunctuation(d.getPlainText()); MaryData result = new MaryData(outputType(), d.getLocale(), true); Document doc = result.getDocument(); Element root = doc.getDocumentElement(); Locale l = determineLocale(plainText, d.getLocale()); root.setAttribute("xml:lang", MaryUtils.locale2xmllang(l)); if (splitIntoParagraphs) { // Empty lines separate paragraphs String[] inputTexts = plainText.split("\\n(\\s*\\n)+"); for (int i = 0; i < inputTexts.length; i++) { String paragraph = inputTexts[i].trim(); if (paragraph.length() == 0) continue; appendParagraph(paragraph, root, d.getLocale()); } } else { // The whole text as one single paragraph appendParagraph(plainText, root, d.getLocale()); } result.setDocument(doc); return result; }