From 76c496db007519125bd478ad81afb9763db7259c Mon Sep 17 00:00:00 2001 From: rsiddharth Date: Fri, 26 Oct 2012 21:48:35 +0530 Subject: added: parsers/DocumentDate.java modified: parsers/Paragraphs.java --- parsers/DocumentDate.java | 17 +++++++++++++++++ parsers/Paragraphs.java | 1 - 2 files changed, 17 insertions(+), 1 deletion(-) create mode 100644 parsers/DocumentDate.java diff --git a/parsers/DocumentDate.java b/parsers/DocumentDate.java new file mode 100644 index 0000000..717fe25 --- /dev/null +++ b/parsers/DocumentDate.java @@ -0,0 +1,17 @@ +package scruf.parsers; + +import java.util.regex.*; + +public class DocumentDate implements Parser { + public String parse(String fileContent) { + String timeTag = "
$2
\n"; + StringBuffer sbuffer = new StringBuffer(); + Pattern pattern = Pattern.compile("(\\$\\$\\$)(.+?)(\\1)"); + Matcher matcher = pattern.matcher(fileContent); + while(matcher.find()) { + matcher.appendReplacement(sbuffer,timeTag); + } + matcher.appendTail(sbuffer); + return sbuffer.toString(); + } +} \ No newline at end of file diff --git a/parsers/Paragraphs.java b/parsers/Paragraphs.java index 2229d35..29a546a 100644 --- a/parsers/Paragraphs.java +++ b/parsers/Paragraphs.java @@ -26,7 +26,6 @@ import java.util.regex.*; public class Paragraphs implements Parser { private String paragraph = "

\n$0

\n"; public String parse(String fileContent) { - System.out.println("Paragraph parsing..."); /** * This regex contains two parts separated by a '|'; the first * part is regex for a html Heading (See Heading.java) and the -- cgit v1.2.3