File: XMLPredefinedEntityReferenceResolver.java

package info (click to toggle)
libjboss-web-services-java 0.0%2Bsvn5660-2
  • links: PTS, VCS
  • area: contrib
  • in suites: lenny
  • size: 7,268 kB
  • ctags: 12,475
  • sloc: java: 79,207; xml: 38; makefile: 19; sh: 15
file content (123 lines) | stat: -rw-r--r-- 3,755 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
/*
* JBoss, Home of Professional Open Source
* Copyright 2005, JBoss Inc., and individual contributors as indicated
* by the @authors tag. See the copyright.txt in the distribution for a
* full listing of individual contributors.
*
* This is free software; you can redistribute it and/or modify it
* under the terms of the GNU Lesser General Public License as
* published by the Free Software Foundation; either version 2.1 of
* the License, or (at your option) any later version.
*
* This software is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with this software; if not, write to the Free
* Software Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
* 02110-1301 USA, or see the FSF site: http://www.fsf.org.
*/
package org.jboss.ws.core.utils;

import java.util.HashMap;

/**
 * Utility class for resolving predefined XML entity and character references.
 * <p>
 * The five predefined entity names (quot, amp, lt, gt, apos) are supported, together
 * with decimal and hexadecimal numeric character references. Malformed or unknown
 * references are reported with an {@link IllegalArgumentException}.
 *
 * @author <a href="mailto:jason.greene@jboss.com">Jason T. Greene</a>
 * @version $Revision: 1757 $
 */
public class XMLPredefinedEntityReferenceResolver
{
   /** Maps a predefined entity name (without the surrounding ampersand and semicolon) to its character. */
   private static final HashMap<String, Character> entities = new HashMap<String, Character>();

   static
   {
      entities.put("quot", '"');
      entities.put("amp", '&');
      entities.put("lt", '<');
      entities.put("gt", '>');
      entities.put("apos", '\'');
   }

   /**
    * Resolves a single numeric character reference and appends the resulting character.
    *
    * @param source the string being processed
    * @param pos the index of the ampersand that starts the reference; the caller has
    *        already verified that the following character is a hash sign
    * @param builder receives the resolved character
    * @return the index of the first character after the terminating semicolon
    * @throws IllegalArgumentException if the reference is truncated, not terminated,
    *         not a number in the selected radix, or not a valid Unicode code point
    */
   private static int resolveCharRef(String source, int pos, StringBuilder builder)
   {
      // Skip the ampersand and the hash sign; guard against input that ends right after them
      int start = pos + 2;
      if (start >= source.length())
         throw new IllegalArgumentException("Invalid character reference");

      int radix = 10;
      if (source.charAt(start) == 'x')
      {
         start++;
         radix = 16;
      }

      int end = source.indexOf(';', start);
      if (end == -1)
         throw new IllegalArgumentException("Invalid character reference");

      // NumberFormatException is an IllegalArgumentException, so bad digits are reported consistently
      int codePoint = Integer.parseInt(source.substring(start, end), radix);

      // appendCodePoint emits a surrogate pair for supplementary characters and
      // rejects values outside the Unicode range instead of silently truncating them
      builder.appendCodePoint(codePoint);

      return end + 1;
   }

   /**
    * Resolves a single predefined entity reference and appends the resulting character.
    *
    * @param source the string being processed
    * @param pos the index of the ampersand that starts the reference
    * @param builder receives the resolved character
    * @return the index of the first character after the terminating semicolon
    * @throws IllegalArgumentException if the reference is not terminated or the
    *         entity name is not one of the predefined ones
    */
   private static int resolveEntityRef(String source, int pos, StringBuilder builder)
   {
      int start = pos + 1;
      int end = source.indexOf(';', start);
      if (end == -1)
         throw new IllegalArgumentException("Invalid entity reference");

      String entity = source.substring(start, end);
      Character c = entities.get(entity);
      if (c == null)
         throw new IllegalArgumentException("Invalid entity: " + entity);

      builder.append(c.charValue());

      return end + 1;
   }

   /**
    * Transforms an XML normalized string by resolving all predefined character and entity references
    *
    * @param normalized an XML normalized string
    * @return a standard java string that is no longer XML normalized; the input itself
    *         is returned when it contains no ampersand
    * @throws IllegalArgumentException if the string contains a malformed or unknown reference
    */
   public static String resolve(String normalized)
   {
      int pos = normalized.indexOf('&');

      // No references
      if (pos == -1)
         return normalized;

      int end = normalized.length();
      // The resolved text is never longer than the input
      StringBuilder builder = new StringBuilder(end);
      int last = 0;

      while (pos != -1)
      {
         // Copy the literal text between the previous reference and this one
         builder.append(normalized, last, pos);

         int peek = pos + 1;
         if (peek == end)
            throw new IllegalArgumentException("Invalid entity reference");

         if (normalized.charAt(peek) == '#')
            pos = resolveCharRef(normalized, pos, builder);
         else
            pos = resolveEntityRef(normalized, pos, builder);

         last = pos;
         pos = normalized.indexOf('&', pos);
      }

      // Copy whatever follows the final reference
      builder.append(normalized, last, end);

      return builder.toString();
   }
}