001/* 002 Licensed to the Apache Software Foundation (ASF) under one 003 or more contributor license agreements. See the NOTICE file 004 distributed with this work for additional information 005 regarding copyright ownership. The ASF licenses this file 006 to you under the Apache License, Version 2.0 (the 007 "License"); you may not use this file except in compliance 008 with the License. You may obtain a copy of the License at 009 010 http://www.apache.org/licenses/LICENSE-2.0 011 012 Unless required by applicable law or agreed to in writing, 013 software distributed under the License is distributed on an 014 "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY 015 KIND, either express or implied. See the License for the 016 specific language governing permissions and limitations 017 under the License. 018 */ 019package org.apache.wiki.htmltowiki; 020 021import java.io.IOException; 022import java.io.Writer; 023import java.util.regex.Matcher; 024import java.util.regex.Pattern; 025 026/** 027 * Part of the XHtmlToWikiTranslator. 028 * 029 */ 030// FIXME: Needs a better description as to how it works. 031public class WhitespaceTrimWriter extends Writer 032{ 033 034 private final StringBuffer m_result = new StringBuffer(); 035 036 private StringBuffer m_buffer = new StringBuffer(); 037 038 private boolean m_trimMode = true; 039 040 private static final Pattern ONLINE_PATTERN = Pattern.compile( ".*?\\n\\s*?", Pattern.MULTILINE ); 041 042 private boolean m_currentlyOnLineBegin = true; 043 044 /** 045 * {@inheritDoc} 046 */ 047 @Override 048 public void flush() 049 { 050 if( m_buffer.length() > 0 ) 051 { 052 String s = m_buffer.toString(); 053 s = s.replaceAll( "\r\n", "\n" ); 054 if( m_trimMode ) 055 { 056 s = s.replaceAll( "(\\w+) \\[\\?\\|Edit\\.jsp\\?page=\\1\\]", "[$1]" ); 057 s = s.replaceAll( "\n{2,}", "\n\n" ); 058 s = s.replaceAll( "\\p{Blank}+", " " ); 059 s = s.replaceAll( "[ ]*\n[ ]*", "\n" ); 060 s = replacePluginNewlineBackslashes( s ); 061 } 062 m_result.append( s ); 063 m_buffer = new StringBuffer(); 064 } 065 } 066 067 private String replacePluginNewlineBackslashes( String s ) 068 { 069 final Pattern p = Pattern.compile( "\\{\\{\\{(.*?)\\}\\}\\}|\\{\\{(.*?)\\}\\}|\\[\\{(.*?)\\}\\]", Pattern.DOTALL 070 + Pattern.MULTILINE ); 071 final Matcher m = p.matcher( s ); 072 final StringBuffer sb = new StringBuffer(); 073 while( m.find() ) 074 { 075 final String groupEscaped = m.group().replaceAll( "\\\\|\\$", "\\\\$0" ); 076 if( m.group( 3 ) != null ) 077 { 078 m.appendReplacement( sb, groupEscaped.replaceAll( "\\\\\\\\\\\\\\\\", "\n" ) ); 079 } 080 else 081 { 082 m.appendReplacement( sb, groupEscaped ); 083 } 084 } 085 m.appendTail( sb ); 086 s = sb.toString(); 087 return s; 088 } 089 090 /** 091 * Returns true, if this Writer is currently trimming any whitespaces. 092 * 093 * @return True, if trimming. 094 */ 095 public boolean isWhitespaceTrimMode() 096 { 097 return m_trimMode; 098 } 099 100 /** 101 * Set the trimming mode on/off. 102 * 103 * @param trimMode True, if you want trimming to be turned on. False otherwise. 104 */ 105 public void setWhitespaceTrimMode(final boolean trimMode ) 106 { 107 if( m_trimMode != trimMode ) 108 { 109 flush(); 110 m_trimMode = trimMode; 111 } 112 } 113 114 /** 115 * {@inheritDoc} 116 */ 117 @Override 118 public void write(final char[] arg0, final int arg1, final int arg2 ) throws IOException 119 { 120 m_buffer.append( arg0, arg1, arg2 ); 121 m_currentlyOnLineBegin = ONLINE_PATTERN.matcher( m_buffer ).matches(); 122 } 123 124 /** 125 * {@inheritDoc} 126 */ 127 @Override 128 public void close() throws IOException 129 {} 130 131 /** 132 * {@inheritDoc} 133 */ 134 @Override 135 public String toString() 136 { 137 flush(); 138 return m_result.toString(); 139 } 140 141 /** 142 * Returns true, if the writer is currently writing a line start. 143 * 144 * @return True or false. 145 */ 146 public boolean isCurrentlyOnLineBegin() 147 { 148 return m_currentlyOnLineBegin; 149 } 150}