[452] | 1 | Namespace ActiveBasic
|
---|
| 2 | Namespace Xml
|
---|
| 3 |
|
---|
| 4 |
|
---|
[465] | 5 | Class ParserException
|
---|
| 6 | Inherits System.Exception
|
---|
| 7 | Public
|
---|
| 8 | Sub ParserException( message As String )
|
---|
| 9 | Exception( message )
|
---|
| 10 | End Sub
|
---|
| 11 | End Class
|
---|
| 12 |
|
---|
[452] | 13 | Class Parser
|
---|
[465] | 14 | xmlString As String
|
---|
| 15 | currentIndex As Long
|
---|
| 16 |
|
---|
| 17 | doc As System.Xml.XmlDocument
|
---|
| 18 |
|
---|
| 19 | Static Const tokenLPar = &H3C ' <
|
---|
| 20 | Static Const tokenRPar = &H3E ' >
|
---|
| 21 | Static Const tokenSlash = &H2F ' /
|
---|
| 22 | Static Const xmlHeaderStr = "<?xml"
|
---|
| 23 | Static Const commentHeader = "<!--"
|
---|
| 24 | Static Const cdataHeader = "<![CDATA["
|
---|
| 25 | Static Const dtdHeader = "<!"
|
---|
| 26 | Static Const versionAttributeName = "version"
|
---|
| 27 | Static Const encodingAttributeName = "encoding"
|
---|
| 28 |
|
---|
| 29 | Static Function IsAlpha( c As Char ) As Boolean
|
---|
| 30 | Return ( &H41 <= c and c <= &H5A or &H61 <= c and c <= &H7A )
|
---|
| 31 | End Function
|
---|
| 32 |
|
---|
| 33 | Static Function IsUnderscore( c As Char ) As Boolean
|
---|
| 34 | Return ( c = &H5F )
|
---|
| 35 | End Function
|
---|
| 36 |
|
---|
| 37 | Static Function IsNumber( c As Char ) As Boolean
|
---|
| 38 | Return ( &H30 <= c and c <= &H39 )
|
---|
| 39 | End Function
|
---|
| 40 |
|
---|
| 41 | Static Function IsWhiteSpace( c As Char ) As Boolean
|
---|
| 42 | If c = &H20 Then
|
---|
| 43 | ' 空白
|
---|
| 44 | Return True
|
---|
| 45 | ElseIf c = &H09 Then
|
---|
| 46 | ' タブ文字
|
---|
| 47 | Return True
|
---|
| 48 | ElseIf c = &H0A or c = &H0D Then
|
---|
| 49 | ' 改行
|
---|
| 50 | Return True
|
---|
| 51 | End If
|
---|
| 52 | ' その他
|
---|
| 53 | Return False
|
---|
| 54 | End Function
|
---|
| 55 |
|
---|
| 56 | Sub ts()
|
---|
| 57 | MessageBox(0,xmlString.Substring(currentIndex),"test",0)
|
---|
| 58 | End Sub
|
---|
| 59 |
|
---|
| 60 | Function StringWordEquals( src As String ) As Boolean
|
---|
| 61 | Dim nextChar = xmlString[currentIndex + src.Length] As Char
|
---|
| 62 | Return ( xmlString.Substring( currentIndex, src.Length ) = src and Not (IsAlpha( nextChar ) or IsUnderscore( nextChar ) or IsNumber( nextChar ) ) )
|
---|
| 63 | End Function
|
---|
| 64 |
|
---|
| 65 | Function ReadName() As String
|
---|
| 66 | Dim startIndex = currentIndex
|
---|
| 67 |
|
---|
| 68 | Dim c = xmlString[currentIndex] As Char
|
---|
| 69 |
|
---|
| 70 | If Not( IsAlpha( c ) or IsUnderscore( c ) ) Then
|
---|
| 71 | Throw New ParserException( Ex"タグ名がアルファベットまたはアンダースコアから始まっていない" )
|
---|
| 72 | End If
|
---|
| 73 |
|
---|
| 74 | While IsAlpha( c ) or IsUnderscore( c ) or IsNumber( c )
|
---|
| 75 | currentIndex++
|
---|
| 76 | c = xmlString[currentIndex] As Char
|
---|
| 77 | Wend
|
---|
| 78 |
|
---|
| 79 | Return xmlString.Substring( startIndex, currentIndex - startIndex )
|
---|
| 80 | End Function
|
---|
| 81 |
|
---|
| 82 | Function ReadStringInDoubleQuotes() As String
|
---|
| 83 | ' '\"'分を進める
|
---|
| 84 | currentIndex++
|
---|
| 85 |
|
---|
| 86 | Dim startIndex = currentIndex
|
---|
| 87 | Dim endIndex = 0 As Long
|
---|
| 88 |
|
---|
| 89 | Do
|
---|
| 90 | If xmlString[currentIndex] = 0 Then
|
---|
| 91 | Throw New ParserException( Ex"属性の値の閉じ側のダブルクォートが存在しない" )
|
---|
| 92 | End If
|
---|
| 93 |
|
---|
| 94 | If xmlString[currentIndex] = &H and xmlString[currentIndex+1] = &H22 Then
|
---|
| 95 | ' エスケープシーケンス付きのダブルクォートは無視
|
---|
| 96 | currentIndex += 2
|
---|
| 97 | Continue
|
---|
| 98 | End If
|
---|
| 99 |
|
---|
| 100 | If xmlString[currentIndex] = &H22 Then ' '\"'
|
---|
| 101 | ' 閉じ側のダブルクォート
|
---|
| 102 | endIndex = currentIndex
|
---|
| 103 | currentIndex++
|
---|
| 104 | Exit Do
|
---|
| 105 | End If
|
---|
| 106 |
|
---|
| 107 | currentIndex++
|
---|
| 108 | Loop
|
---|
| 109 |
|
---|
| 110 | Return xmlString.Substring( startIndex, endIndex - startIndex )
|
---|
| 111 | End Function
|
---|
| 112 |
|
---|
| 113 | Function ReadAttribute() As System.Xml.XmlAttribute
|
---|
| 114 | Dim attributeName = ReadName()
|
---|
| 115 | SkipWhiteSpace()
|
---|
| 116 |
|
---|
| 117 | Dim atr = doc.CreateAttribute( attributeName )
|
---|
| 118 |
|
---|
| 119 | If Not xmlString[currentIndex] = &H3D Then ' '='
|
---|
| 120 | Return atr
|
---|
| 121 | End If
|
---|
| 122 |
|
---|
| 123 | currentIndex++ ' '='分を進める
|
---|
| 124 | SkipWhiteSpace()
|
---|
| 125 |
|
---|
| 126 | If Not xmlString[currentIndex] = &H22 Then '\"'
|
---|
| 127 | Throw New ParserException( Ex"属性の値がダブルクォートで囲まれていない" )
|
---|
| 128 | End If
|
---|
| 129 |
|
---|
| 130 | atr.Value = ReadStringInDoubleQuotes()
|
---|
| 131 |
|
---|
| 132 | Return atr
|
---|
| 133 | End Function
|
---|
| 134 |
|
---|
| 135 | Function ReadTextArea() As String
|
---|
| 136 | Dim startIndex = currentIndex
|
---|
| 137 |
|
---|
| 138 | While Not ( xmlString[currentIndex] = tokenLPar or xmlString[currentIndex] = 0 )
|
---|
| 139 | currentIndex++
|
---|
| 140 | Wend
|
---|
| 141 |
|
---|
| 142 | Return xmlString.Substring( startIndex, currentIndex - startIndex )
|
---|
| 143 | End Function
|
---|
| 144 |
|
---|
| 145 | Sub SkipWhiteSpace()
|
---|
| 146 | While IsWhiteSpace( xmlString[currentIndex] )
|
---|
| 147 | currentIndex++
|
---|
| 148 | Wend
|
---|
| 149 | End Sub
|
---|
| 150 |
|
---|
| 151 | Function ParseDeclaration() As System.Xml.XmlDeclaration
|
---|
| 152 | Dim versionStr = Nothing As String
|
---|
| 153 | Dim encodingStr = Nothing As String
|
---|
| 154 | currentIndex += xmlHeaderStr.Length
|
---|
| 155 |
|
---|
| 156 | SkipWhiteSpace()
|
---|
| 157 |
|
---|
| 158 | Do
|
---|
| 159 | If xmlString[currentIndex] = 0 Then
|
---|
| 160 | Throw New ParserException( Ex"タグの閉じ括弧が見つからない" )
|
---|
| 161 | End If
|
---|
| 162 | If xmlString[currentIndex] = tokenRPar Then
|
---|
| 163 | currentIndex ++
|
---|
| 164 | Exit Do
|
---|
| 165 | End If
|
---|
| 166 |
|
---|
| 167 | currentIndex ++
|
---|
| 168 | Loop
|
---|
| 169 |
|
---|
| 170 | Return doc.CreateXmlDeclaration( "1.0", "shift-jis", Nothing )
|
---|
| 171 | End Function
|
---|
| 172 | Function ParseComment() As System.Xml.XmlNode
|
---|
| 173 | End Function
|
---|
| 174 | Function ParseCData() As System.Xml.XmlNode
|
---|
| 175 | End Function
|
---|
| 176 | Function ParseDtd() As System.Xml.XmlNode
|
---|
| 177 | End Function
|
---|
| 178 | Function ParseElement() As System.Xml.XmlElement
|
---|
| 179 | ' '<'分を進める
|
---|
| 180 | currentIndex++
|
---|
| 181 |
|
---|
| 182 | ' タグ名を取得し、要素を作成
|
---|
| 183 | Dim name = ReadName()
|
---|
| 184 | Dim xmlElement = doc.CreateElement( name )
|
---|
| 185 |
|
---|
| 186 | SkipWhiteSpace()
|
---|
| 187 |
|
---|
| 188 | Do
|
---|
| 189 | If xmlString[currentIndex] = 0 Then
|
---|
| 190 | Throw New ParserException( Ex"タグの閉じ括弧が見つからない" )
|
---|
| 191 | End If
|
---|
| 192 | If xmlString[currentIndex] = tokenRPar or ( xmlString[currentIndex] = tokenSlash and xmlString[currentIndex+1] = tokenRPar ) Then
|
---|
| 193 | Exit Do
|
---|
| 194 | End If
|
---|
| 195 |
|
---|
| 196 | ' 属性を取得し、要素に追加
|
---|
| 197 | xmlElement.Attributes.Add( ReadAttribute() )
|
---|
| 198 |
|
---|
| 199 | SkipWhiteSpace()
|
---|
| 200 | Loop
|
---|
| 201 |
|
---|
| 202 | Dim closeTagStr = "</" + xmlElement.LocalName + ">"
|
---|
| 203 |
|
---|
| 204 | If xmlString[currentIndex] = tokenRPar Then ' '>'
|
---|
| 205 | ' ">" で閉じられている
|
---|
| 206 | currentIndex ++
|
---|
| 207 |
|
---|
| 208 | Do
|
---|
| 209 | SkipWhiteSpace()
|
---|
| 210 |
|
---|
| 211 | If xmlString[currentIndex] = 0 Then
|
---|
| 212 | Throw New ParserException( xmlElement.LocalName + Ex"の閉じタグが見つからない" )
|
---|
| 213 | End If
|
---|
| 214 |
|
---|
| 215 | If xmlString[currentIndex] = tokenLPar Then ' '<'
|
---|
| 216 | ' タグ
|
---|
| 217 | If StringWordEquals( closeTagStr ) Then
|
---|
| 218 | ' タグが閉じられた
|
---|
| 219 | currentIndex += closeTagStr.Length
|
---|
| 220 | Exit Do
|
---|
| 221 | End If
|
---|
| 222 |
|
---|
| 223 | xmlElement.AppendChild( ParseNode() )
|
---|
| 224 | Else
|
---|
| 225 | ' タグ以外
|
---|
| 226 | xmlElement.AppendChild( doc.CreateTextNode( ReadTextArea() ) )
|
---|
| 227 | End If
|
---|
| 228 | Loop
|
---|
| 229 | Else
|
---|
| 230 | ' "/>" で閉じられている
|
---|
| 231 | currentIndex += 2
|
---|
| 232 | End If
|
---|
| 233 |
|
---|
| 234 | Return xmlElement
|
---|
| 235 | End Function
|
---|
| 236 |
|
---|
| 237 | Function ParseNode() As System.Xml.XmlNode
|
---|
| 238 | If Not xmlString[currentIndex] = tokenLPar Then
|
---|
| 239 | ' "<" で開始できないとき
|
---|
| 240 | Throw New ParserException( Ex"\q<\q で開始できない" )
|
---|
| 241 | End If
|
---|
| 242 |
|
---|
| 243 | If StringWordEquals( xmlHeaderStr ) Then
|
---|
| 244 | ' XMLヘッダ
|
---|
| 245 | Return ParseDeclaration()
|
---|
| 246 | ElseIf StringWordEquals( commentHeader ) Then
|
---|
| 247 | ' コメントヘッダ
|
---|
| 248 | Return ParseComment()
|
---|
| 249 | ElseIf StringWordEquals( cdataHeader ) Then
|
---|
| 250 | ' CDATAヘッダ
|
---|
| 251 | Return ParseCData()
|
---|
| 252 | ElseIf StringWordEquals( dtdHeader ) Then
|
---|
| 253 | ' DTDヘッダ
|
---|
| 254 | Return ParseDtd()
|
---|
| 255 | Else
|
---|
| 256 | ' その他のタグ
|
---|
| 257 | Return ParseElement()
|
---|
| 258 | End If
|
---|
| 259 | End Function
|
---|
| 260 |
|
---|
[452] | 261 | Public
|
---|
[465] | 262 |
|
---|
| 263 | Sub Parser( xmlString As String, doc As System.Xml.XmlDocument )
|
---|
| 264 | This.xmlString = xmlString
|
---|
| 265 | This.doc = doc
|
---|
| 266 | End Sub
|
---|
| 267 |
|
---|
| 268 | Sub Parse()
|
---|
| 269 | This.currentIndex = 0
|
---|
| 270 | This.doc.RemoveAll()
|
---|
| 271 |
|
---|
| 272 | SkipWhiteSpace()
|
---|
| 273 |
|
---|
| 274 | While currentIndex < xmlString.Length
|
---|
| 275 |
|
---|
| 276 | This.doc.AppendChild( ParseNode() )
|
---|
| 277 |
|
---|
| 278 | SkipWhiteSpace()
|
---|
| 279 | Wend
|
---|
| 280 | End Sub
|
---|
| 281 |
|
---|
| 282 | Static Sub Parse( xmlString As String, doc As System.Xml.XmlDocument )
|
---|
| 283 | Dim parser = New Parser( xmlString, doc )
|
---|
| 284 | parser.Parse()
|
---|
| 285 | End Sub
|
---|
[452] | 286 | End Class
|
---|
| 287 |
|
---|
| 288 |
|
---|
| 289 | End Namespace
|
---|
| 290 | End Namespace
|
---|