1*24acc546SAndrew Rist /**************************************************************
2cdf0e10cSrcweir  *
3*24acc546SAndrew Rist  * Licensed to the Apache Software Foundation (ASF) under one
4*24acc546SAndrew Rist  * or more contributor license agreements.  See the NOTICE file
5*24acc546SAndrew Rist  * distributed with this work for additional information
6*24acc546SAndrew Rist  * regarding copyright ownership.  The ASF licenses this file
7*24acc546SAndrew Rist  * to you under the Apache License, Version 2.0 (the
8*24acc546SAndrew Rist  * "License"); you may not use this file except in compliance
9*24acc546SAndrew Rist  * with the License.  You may obtain a copy of the License at
10*24acc546SAndrew Rist  *
11*24acc546SAndrew Rist  *   http://www.apache.org/licenses/LICENSE-2.0
12*24acc546SAndrew Rist  *
13*24acc546SAndrew Rist  * Unless required by applicable law or agreed to in writing,
14*24acc546SAndrew Rist  * software distributed under the License is distributed on an
15*24acc546SAndrew Rist  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
16*24acc546SAndrew Rist  * KIND, either express or implied.  See the License for the
17*24acc546SAndrew Rist  * specific language governing permissions and limitations
18*24acc546SAndrew Rist  * under the License.
19*24acc546SAndrew Rist  *
20*24acc546SAndrew Rist  *************************************************************/
21*24acc546SAndrew Rist 
22*24acc546SAndrew Rist 
23cdf0e10cSrcweir 
24cdf0e10cSrcweir // MARKER(update_precomp.py): autogen include statement, do not remove
25cdf0e10cSrcweir #include "precompiled_forms.hxx"
26cdf0e10cSrcweir 
27cdf0e10cSrcweir #include <com/sun/star/xml/xpath/XPathObjectType.hpp>
28cdf0e10cSrcweir #include <com/sun/star/xml/dom/XNode.hpp>
29cdf0e10cSrcweir #include <com/sun/star/xml/dom/XText.hpp>
30cdf0e10cSrcweir #include <com/sun/star/xml/dom/XNodeList.hpp>
31cdf0e10cSrcweir #include <com/sun/star/xml/dom/NodeType.hpp>
32cdf0e10cSrcweir 
33cdf0e10cSrcweir #include <rtl/ustrbuf.hxx>
34cdf0e10cSrcweir #include <rtl/strbuf.hxx>
35cdf0e10cSrcweir #include <unotools/processfactory.hxx>
36cdf0e10cSrcweir 
37cdf0e10cSrcweir #include <stdio.h>
38cdf0e10cSrcweir 
39cdf0e10cSrcweir #include "serialization_urlencoded.hxx"
40cdf0e10cSrcweir 
41cdf0e10cSrcweir using namespace utl;
42cdf0e10cSrcweir using namespace CSS::uno;
43cdf0e10cSrcweir using namespace CSS::io;
44cdf0e10cSrcweir using namespace CSS::xml::xpath;
45cdf0e10cSrcweir using namespace CSS::xml::dom;
46cdf0e10cSrcweir 
CSerializationURLEncoded()47cdf0e10cSrcweir CSerializationURLEncoded::CSerializationURLEncoded()
48cdf0e10cSrcweir     : m_aFactory(getProcessServiceFactory())
49cdf0e10cSrcweir     , m_aPipe(Reference< XOutputStream > (m_aFactory->createInstance(
50cdf0e10cSrcweir         ::rtl::OUString::createFromAscii("com.sun.star.io.Pipe")), UNO_QUERY))
51cdf0e10cSrcweir {
52cdf0e10cSrcweir }
53cdf0e10cSrcweir 
54cdf0e10cSrcweir 
55cdf0e10cSrcweir /*
56cdf0e10cSrcweir  rfc2396
57cdf0e10cSrcweir  reserved    = ";" | "/" | "?" | ":" | "@" | "&" | "=" | "+" |
58cdf0e10cSrcweir                     "$" | ","
59cdf0e10cSrcweir  mark        = "-" | "_" | "." | "!" | "~" | "*" | "'" | "(" | ")"
60cdf0e10cSrcweir  unreserved = alphanum | mark
61cdf0e10cSrcweir */
is_unreserved(sal_Char c)62cdf0e10cSrcweir sal_Bool CSerializationURLEncoded::is_unreserved(sal_Char c)
63cdf0e10cSrcweir {
64cdf0e10cSrcweir     //digit?
65cdf0e10cSrcweir     if (c >= '0' && c <= '9') return sal_True;
66cdf0e10cSrcweir     if (c >= 'A' && c <= 'Z') return sal_True;
67cdf0e10cSrcweir     if (c >= 'a' && c <= 'z') return sal_True;
68cdf0e10cSrcweir     switch (c) {
69cdf0e10cSrcweir         case '-':
70cdf0e10cSrcweir         case '_':
71cdf0e10cSrcweir         case '.':
72cdf0e10cSrcweir         case '!':
73cdf0e10cSrcweir         case '~':
74cdf0e10cSrcweir         case '*':
75cdf0e10cSrcweir         case '\'':
76cdf0e10cSrcweir         case '(':
77cdf0e10cSrcweir         case ')':
78cdf0e10cSrcweir             return sal_True;
79cdf0e10cSrcweir     }
80cdf0e10cSrcweir     return sal_False;
81cdf0e10cSrcweir }
encode_and_append(const::rtl::OUString & aString,::rtl::OStringBuffer & aBuffer)82cdf0e10cSrcweir void  CSerializationURLEncoded::encode_and_append(const ::rtl::OUString& aString, ::rtl::OStringBuffer& aBuffer)
83cdf0e10cSrcweir {
84cdf0e10cSrcweir     ::rtl::OString utf8String = OUStringToOString(aString, RTL_TEXTENCODING_UTF8);
85cdf0e10cSrcweir     const sal_uInt8 *pString = reinterpret_cast< const sal_uInt8 * >( utf8String.getStr() );
86cdf0e10cSrcweir     sal_Char tmpChar[4]; tmpChar[3] = 0;
87cdf0e10cSrcweir 
88cdf0e10cSrcweir     while( *pString != 0)
89cdf0e10cSrcweir     {
90cdf0e10cSrcweir         if( *pString < 0x80 )
91cdf0e10cSrcweir         {
92cdf0e10cSrcweir             if ( is_unreserved(*pString) ) {
93cdf0e10cSrcweir                 aBuffer.append(*pString);
94cdf0e10cSrcweir             } else if (*pString == 0x20) {
95cdf0e10cSrcweir                 aBuffer.append('+');
96cdf0e10cSrcweir             } else if (*pString == 0x0d && *(pString+1) == 0x0a) {
97cdf0e10cSrcweir                 aBuffer.append("%0D%0A");
98cdf0e10cSrcweir                 pString++;
99cdf0e10cSrcweir             } else if (*pString == 0x0a) {
100cdf0e10cSrcweir                 aBuffer.append("%0D%0A");
101cdf0e10cSrcweir             } else {
102cdf0e10cSrcweir                 snprintf(tmpChar, 3, "%%%X", *pString % 0x100);
103cdf0e10cSrcweir                 aBuffer.append(tmpChar);
104cdf0e10cSrcweir             }
105cdf0e10cSrcweir         } else {
106cdf0e10cSrcweir             snprintf(tmpChar, 3, "%%%X", *pString % 0x100);
107cdf0e10cSrcweir             aBuffer.append(tmpChar);
108cdf0e10cSrcweir             while (*pString >= 0x80) {
109cdf0e10cSrcweir                 // continuation...
110cdf0e10cSrcweir                 pString++;
111cdf0e10cSrcweir                 snprintf(tmpChar, 3, "%%%X", *pString % 0x100);
112cdf0e10cSrcweir                 aBuffer.append(tmpChar);
113cdf0e10cSrcweir             }
114cdf0e10cSrcweir         }
115cdf0e10cSrcweir         pString++;
116cdf0e10cSrcweir     }
117cdf0e10cSrcweir }
118cdf0e10cSrcweir 
serialize_node(const Reference<XNode> & aNode)119cdf0e10cSrcweir void CSerializationURLEncoded::serialize_node(const Reference< XNode >& aNode)
120cdf0e10cSrcweir {
121cdf0e10cSrcweir     // serialize recursive
122cdf0e10cSrcweir     // every element node E that has a text child T will be serialized in document order
123cdf0e10cSrcweir     // <E1>T1<E2>T2</E2></E1><E3>T3</E3> -> E1=T2&E2=T2&E3=T3 (En := local name)
124cdf0e10cSrcweir 
125cdf0e10cSrcweir     // this node
126cdf0e10cSrcweir     Reference< XNodeList > aChildList = aNode->getChildNodes();
127cdf0e10cSrcweir     Reference< XNode > aChild;
128cdf0e10cSrcweir     // is this an element node?
129cdf0e10cSrcweir     if (aNode->getNodeType() == NodeType_ELEMENT_NODE)
130cdf0e10cSrcweir     {
131cdf0e10cSrcweir         ::rtl::OUString  aName = aNode->getNodeName();
132cdf0e10cSrcweir         // find any text children
133cdf0e10cSrcweir         ::rtl::OUStringBuffer aValue;
134cdf0e10cSrcweir         Reference< XText > aText;
135cdf0e10cSrcweir         for(sal_Int32 i=0; i < aChildList->getLength(); i++)
136cdf0e10cSrcweir         {
137cdf0e10cSrcweir             aChild = aChildList->item(i);
138cdf0e10cSrcweir             if (aChild->getNodeType() == NodeType_TEXT_NODE)
139cdf0e10cSrcweir             {
140cdf0e10cSrcweir                 aText = Reference< XText >(aChild, UNO_QUERY);
141cdf0e10cSrcweir                 aValue.append(aText->getData());
142cdf0e10cSrcweir             }
143cdf0e10cSrcweir         }
144cdf0e10cSrcweir 
145cdf0e10cSrcweir         // found anything?
146cdf0e10cSrcweir         if (aValue.getLength() > 0)
147cdf0e10cSrcweir         {
148cdf0e10cSrcweir             ::rtl::OUString aUnencValue = aValue.makeStringAndClear();
149cdf0e10cSrcweir             ::rtl::OStringBuffer aEncodedBuffer;
150cdf0e10cSrcweir             encode_and_append(aName, aEncodedBuffer);
151cdf0e10cSrcweir             aEncodedBuffer.append("=");
152cdf0e10cSrcweir             encode_and_append(aUnencValue, aEncodedBuffer);
153cdf0e10cSrcweir             aEncodedBuffer.append("&");
154cdf0e10cSrcweir             sal_Int8 *pData = (sal_Int8*)aEncodedBuffer.getStr();
155cdf0e10cSrcweir             Sequence< sal_Int8 > sData(pData, aEncodedBuffer.getLength());
156cdf0e10cSrcweir             m_aPipe->writeBytes(sData);
157cdf0e10cSrcweir         }
158cdf0e10cSrcweir     }
159cdf0e10cSrcweir 
160cdf0e10cSrcweir     // element children...
161cdf0e10cSrcweir     for(sal_Int32 i=0; i < aChildList->getLength(); i++)
162cdf0e10cSrcweir     {
163cdf0e10cSrcweir         aChild = aChildList->item(i);
164cdf0e10cSrcweir         // if this is an element node, it might be a candidate for serialization
165cdf0e10cSrcweir         if (aChild.is() && aChild->getNodeType() == NodeType_ELEMENT_NODE)
166cdf0e10cSrcweir             serialize_node(aChild);
167cdf0e10cSrcweir     }
168cdf0e10cSrcweir 
169cdf0e10cSrcweir     // siblings...
170cdf0e10cSrcweir //    Reference< XNode > aSibling = aNode->getNextSibling();
171cdf0e10cSrcweir //    if (aSibling.is())
172cdf0e10cSrcweir //        serialize_node(aSibling);
173cdf0e10cSrcweir 
174cdf0e10cSrcweir }
175cdf0e10cSrcweir 
176cdf0e10cSrcweir /*
177cdf0e10cSrcweir void CSerializationURLEncoded::serialize_nodeset()
178cdf0e10cSrcweir {
179cdf0e10cSrcweir     Reference< XNodeList > aNodeList = m_aXPathObject->getNodeList();
180cdf0e10cSrcweir     for (sal_Int32 i=0; i<aNodeList->getLength(); i++)
181cdf0e10cSrcweir         serialize_node(aNodeList->item(i));
182cdf0e10cSrcweir     m_aPipe->closeOutput();
183cdf0e10cSrcweir }
184cdf0e10cSrcweir */
185cdf0e10cSrcweir 
serialize()186cdf0e10cSrcweir void CSerializationURLEncoded::serialize()
187cdf0e10cSrcweir {
188cdf0e10cSrcweir 
189cdf0e10cSrcweir     // output stream to the pipe buffer
190cdf0e10cSrcweir     Reference< XOutputStream > out(m_aPipe, UNO_QUERY);
191cdf0e10cSrcweir 
192cdf0e10cSrcweir     CSS::uno::Reference< CSS::xml::dom::XNode > cur = m_aFragment->getFirstChild();
193cdf0e10cSrcweir     while (cur.is())
194cdf0e10cSrcweir     {
195cdf0e10cSrcweir         serialize_node(cur);
196cdf0e10cSrcweir         cur = cur->getNextSibling();
197cdf0e10cSrcweir     }
198cdf0e10cSrcweir     m_aPipe->closeOutput();
199cdf0e10cSrcweir }
200cdf0e10cSrcweir 
getInputStream()201cdf0e10cSrcweir Reference< XInputStream > CSerializationURLEncoded::getInputStream()
202cdf0e10cSrcweir {
203cdf0e10cSrcweir     return Reference< XInputStream >(m_aPipe, UNO_QUERY);
204cdf0e10cSrcweir }
205cdf0e10cSrcweir 
206cdf0e10cSrcweir 
207