/ - Diff - gvSIG scripting - gvSIG

Revision 548

     /* gvSIG. Geographic Information System of the Valencian Government
+     *
      * Copyright (C) 2007-2008 Infrastructures and Transports Department
      * of the Valencian Government (CIT)
+     *
      * This program is free software; you can redistribute it and/or
      * modify it under the terms of the GNU General Public License
      * as published by the Free Software Foundation; either version 2
      * of the License, or (at your option) any later version.
+     *
      * This program is distributed in the hope that it will be useful,
      * but WITHOUT ANY WARRANTY; without even the implied warranty of
      * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
      * GNU General Public License for more details.
+     *
      * You should have received a copy of the GNU General Public License
      * along with this program; if not, write to the Free Software
      * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
      * MA  02110-1301, USA.
+     *
      */
     package org.gvsig.scripting.app.extension;
     import junit.framework.Test;
     import junit.framework.TestCase;
     import junit.framework.TestSuite;
     /**
      * Placeholder JUnit (junit.framework) test case for the scripting app
      * extension. Its only test asserts a constant and therefore always passes.
      */
     public class AppTest
         extends TestCase
+    {
         /**
          * Create the test case
+         *
          * @param testName name of the test case, forwarded to TestCase
          */
         public AppTest( String testName )
+        {
             super( testName );
+        }
         /**
          * @return a TestSuite built from AppTest.class
          */
         public static Test suite()
+        {
             return new TestSuite( AppTest.class );
+        }
         /**
          * Rigorous Test :-)
          * (asserts a constant true value; it exercises no production code)
          */
         public void testApp()
+        {
             assertTrue( true );
+        }
+    }

     #!/bin/sh
     #
     # Launcher for the gvSIG scripting main class.
     #
     # 1. Moves to the directory that contains this script.
     # 2. Locates the gvSIG installation folder: either this directory (when it
     #    holds lib/org.gvsig.andami-2*) or three levels up (when it holds
     #    lib/org.gvsig.scripting.main-*).
     # 3. Builds the classpath from the jar/zip files of a fixed list of
     #    extensions and hands control to gvSIG.sh.
     #
     #set -x

     # Succeeds when at least one argument is an existing regular file.
     # Called with a glob, so zero matches or several matches are both handled
     # (a bare `[ -f glob ]` fails with "too many arguments" on several matches).
     _gvsig_has_file() {
       for _gvsig_f in "$@" ; do
         if [ -f "$_gvsig_f" ] ; then
           return 0
         fi
       done
       return 1
     }

     cd "$(dirname "$0")" || exit 1
     # $0 may be relative to the directory we just left, so it must not be
     # resolved again from here: derive the installation folder from $PWD.
     if _gvsig_has_file lib/org.gvsig.andami-2* ; then
       GVSIG_HOME=$PWD
     elif _gvsig_has_file lib/org.gvsig.scripting.main-* ; then
       GVSIG_HOME=$PWD/../../..
     else
       echo "Can't locate gvSIG installation folder"
       exit 1
     fi
     cd "${GVSIG_HOME}" || exit 1
     # Normalise to an absolute path without the ../ components.
     GVSIG_HOME=$PWD
     for d in gvSIG/extensiones/org.gvsig.app/lib \
       gvSIG/extensiones/org.gvsig.scripting.app.extension/lib \
       gvSIG/extensiones/org.gvsig.geometry.app.generalpath/lib \
       gvSIG/extensiones/org.gvsig.projection.app.proj4j/lib \
       gvSIG/extensiones/org.gvsig.projection.app.jcrs/lib ;
       do
       # Jars first, then zips, in the same order as before.
       for i in "$d"/*.jar "$d"/*.zip ; do
         # An unmatched glob is left as a literal pattern; skip it instead of
         # putting a non-existent entry on the classpath.
         if [ -e "$i" ] ; then
           LIBRARIES="$LIBRARIES:$i"
         fi
       done
     done
     GVSIG_LAUNCHER=org.gvsig.scripting.main.Main
     GVSIG_CLASSPATH="$LIBRARIES"
     # "$*" is the well-defined way to flatten the arguments into one string.
     GVSIG_PARAMS=" --plugins-folder=gvSIG/extensiones $*"
     . ./gvSIG.sh

     <?xml version="1.0"?>
     <!--
     Definitions of plugin persistence org.gvsig.scripting.app.mainplugin.
      -->
     <definitions>
       <version>1.0.0</version>
       <classes>
         <class name="org.gvsig.scripting.app.mainplugin">
           <description>Persistence of scripting plugin</description>
           <fields>
             <field name="ComposerUseHisWindowManager" type="boolean" mandatory="true" defaultValue="true">
             <description>When true, the composer uses its own window manager instead of the gvSIG window manager.</description>
             </field>
           </fields>
         </class>
       </classes>
     </definitions>

     _Scripting=Scripting
     _Show_scripting_launcher=Abrir lanzador de scripts
     _Show_scripting_composer=Abrir editor de scripts
     _Show_scripting_jython_console=Abrir consola Jython
     User=Usuario
     System=Sistema
     Accept=Aceptar
     Cancel=Cancelar
     Apply=Aplicar
     Retrieving_data=Recibiendo datos...
     File=Fichero
     New=Nuevo
     Close_document=Cerrar documento
     Close_all_documents=Cerrar todos los documentos
     Run=Ejecutar
     Save=Guardar
     Close=Cerrar
     Close_current_tab=Cerrar pesta\u00f1a actual
     Open_edition_mode=Abrir modo edici\u00f3n
     Run_selected_script=Ejecutar script seleccionado
     Delete_selected_script=Borrar script seleccionado
     Refresh_directories=Actualizar carpetas
     Move_files=Mover ficheros
     Set_file_preferences=Editar preferencias de fichero
     Edit=Editar
     Cut=Cortar
     Copy=Copiar
     Paste=Pegar
     Select_all=Seleccionar todo
     Tools=Herramientas
     Launcher=Lanzador de scripts
     Scripting_Launcher=Lanzador de scripts
     Scripting_Composer=Editor de scripts
     Jython_Console=Consola Jython
     Import_JavaDoc=Importar JavaDoc
     JavaDoc=Ayuda de Java (JavaDoc)
     Remove_JavaDoc=Eliminar JavaDoc
     Help_contents=Contenido de la ayuda
     About_scripts_editor=Acerca del editor de scripts
     Get_help=Ayuda
     Help=Ayuda
     _Package_script=Empaquetar script...
     _Package_help=Empaquetar ayuda...
     Problems=Errores
     Console=Consola
     Description=Descripci\u00f3n
     Resource=Recurso
     Location=Ubicaci\u00f3n
     no_line=sin l\u00ednea
     Line=L\u00ednea
     Welcome_message=Bienvenido al entorno de scripting v1.0
     Error_opening_in_edition_mode_title=Error al abrir fichero
     Error_opening_in_edition_mode=No se pudo abrir el fichero en modo edici\u00f3n
     New_Script=Nuevo elemento
     New_Script_Description=Crea un nuevo script, di\u00e1logo, proyecto, directorio
     Deleting_JavaDocs_successfully_title=Operaci\u00f3n realizada con \u00e9xito
     Deleting_JavaDocs_successfully=Eliminaci\u00f3n de los JavaDocs exitosa
     Import_JavaDoc_title=Importar JavaDocs desde los directorios de sistema al ScriptingFramework JavaDoc
     Remove_JavaDoc_title=Eliminar JavaDocs del ScriptingFramework JavaDoc
     projects_modified_title=Proyectos sin guardar
     projects_modified=Algunos proyectos han sido modificados. \u00bfSalvar cambios?
     project_modified=ha sido modificado. \u00bfSalvar cambios?
     Delete_all_title=Borrar el proyecto
     Delete_all_message=Esta acci\u00f3n elimina el directorio y todo su contenido. \u00bfContinuar?
     About_us_title=Informaci\u00f3n de todos los contribuidores al proyecto gvSIG
     Success=Operaci\u00f3n realizada con \u00e9xito
     Error=Error
     Error_renaming=Inesperado error renombrando el fichero
     Error_moving=Inesperado error moviendo el fichero
     Error_help=Selecciona una ayuda
     Rename_succesfully=Renombrado del fichero realizado con \u00e9xito
     Select_first=Debe seleccionar un fichero primero
     help_key=No hay ayuda para el texto
     script_filesystem=script en el \u00e1rbol de directorio
     Move=Mover
     move_desc=Cambia la ubicaci\u00f3n del fichero seleccionado
     Rename=Renombrar
     rename_desc=Cambia el nombre y otras propiedades del fichero seleccionado
     Moving_succesfully=Reubicaci\u00f3n del fichero realizado con \u00e9xito
     Dialog=Di\u00e1logo
     Code=C\u00f3digo
     Properties=Propiedades
     current_name=Nombre actual
     new_name=Nuevo nombre
     rename_name_title=Cambiar el nombre del fichero
     more_properties=M\u00e1s propiedades
     Javadoc_remove=Selecciona el JavaDoc a eliminar
     no_Javadoc_remove=No hay JavaDoc para eliminar
     Name=Nombre
     Version=Versi\u00f3n
     Created_by=Creado por
     Description=Descripci\u00f3n
     Type=Tipo
     Language=Lenguaje
     Author=Autor
     Move_from=Mover desde
     Move_to=Destino
     Browse=Abrir
     Import_from=Importar desde
     Name_blank=El nombre no puede estar en blanco
     Name_exists=Este nombre ya existe. Debe elegir otro
     Import_success=Los JavaDocs se han importado satisfactoriamente
     JavaDoc_Error=Selecciona JavaDoc a importar
     go_to_line_Xhorizontal_ellipsisX=Ir a la l\u00ednea\u2026
     find_Xhorizontal_ellipsisX=Buscar\u2026
     replace_Xhorizontal_ellipsisX=Reemplazar\u2026
     _Searching_autorun_scripts_Xhorizontal_ellipsisX=Buscando scripts de autoarranque...
     _Running_autorun_script_from_XnameX=Ejecutando script de autoarranque desde {0}

     _Scripting=Scripting
     _Show_scripting_launcher=Show scripting launcher
     _Show_scripting_composer=Show scripting composer
     _Show_scripting_jython_console=Show Jython console
     User=User
     System=System
     Accept=Accept
     Cancel=Cancel
     Apply=Apply
     Retrieving_data=Retrieving data...
     File=File
     New=New
     Close_document=Close document
     Close_all_documents=Close all documents
     Run=Run
     Save=Save
     Close=Close
     Close_current_tab=Close current tab
     Open_edition_mode=Open edition mode
     Run_selected_script=Run selected script
     Delete_selected_script=Delete selected script
     Refresh_directories=Refresh directories
     Move_files=Move files
     Set_file_preferences=Set file preferences
     _Running_autorun_script_from_XnameX=Running autorun script from {0}
     Edit=Edit
     Cut=Cut
     Copy=Copy
     Paste=Paste
     Select_all=Select all
     Tools=Tools
     Launcher=Scripting Launcher
     Scripting_Launcher=Scripting Launcher
     Scripting_Composer=Scripting Composer
     Jython_Console=Jython console
     Import_JavaDoc=Import JavaDoc
     JavaDoc=Java Help (JavaDoc)
     Remove_JavaDoc=Remove JavaDoc
     Help_contents=Help contents
     About_scripts_editor=About scripts editor
     Get_help=Help
     Help=Help
     _Package_script=Package script...
     _Package_help=Package help...
     Problems=Errors
     Console=Console
     Description=Description
     Resource=Resource
     Location=Location
     no_line=no line
     Line=Line
     Welcome_message=Welcome to the scripting framework v1.0
     Error_opening_in_edition_mode_title=Error opening file in edition mode
     Error_opening_in_edition_mode=The file can't be opened in edition mode
     New_Script=New element
     New_Script_Description=Create a new script, dialog, project, directory
     Deleting_JavaDocs_successfully_title=Operation successful
     Deleting_JavaDocs_successfully=Deleting JavaDocs successfully
     Import_JavaDoc_title=Import JavaDocs from filesystem to ScriptingFramework JavaDoc
     Remove_JavaDoc_title=Remove JavaDocs from ScriptingFramework JavaDoc
     projects_modified_title=Projects without saving
     projects_modified=Some projects have been modified. Save changes?
     project_modified=has been modified. Save changes?
     Delete_all_title=Delete project
     Delete_all_message=This action removes the directory and all its content. Continue?
     About_us_title=Information about all the gvSIG's contributors
     Success=Operation done successfully
     Error=Error
     Error_renaming=Unexpected error renaming the file
     Error_moving=Unexpected error moving the file
     Error_help=Select help
     Rename_succesfully=File renamed successfully
     Select_first=Select a file first
     help_key=There isn't any help to this text
     script_filesystem=script filesystem
     Move=Move
     move_desc=Change location of selected file
     Rename=Rename
     rename_desc=Change the name and more properties of the selected file
     Moving_succesfully=File moved successfully
     Dialog=Dialog
     Code=Code
     Properties=Properties
     current_name=Current name
     new_name=New name
     rename_name_title=Change filename
     more_properties=more properties
     Javadoc_remove=Choose JavaDoc to delete
     no_Javadoc_remove=There's no JavaDoc to delete
     Name=Name
     Version=Version
     Created_by=Created by
     Description=Description
     Type=Type
     Language=Language
     Author=Author
     Move_from=Move from
     Move_to=Move to
     Browse=Browse
     Import_from=Import from
     Name_blank=Name can't be blank
     Name_exists=This name already exists. Choose another one
     Import_success=JavaDocs imported successfully
     JavaDoc_Error=Select JavaDoc to import
     go_to_line_Xhorizontal_ellipsisX=Go To Line\u2026
     find_Xhorizontal_ellipsisX=Find\u2026
     replace_Xhorizontal_ellipsisX=Replace\u2026
     _Searching_autorun_scripts_Xhorizontal_ellipsisX=Searching autorun scripts...
     _Running_autorun_script_from_XnameX=Running autorun script from {0}

     """Beautiful Soup
     Elixir and Tonic
     "The Screen-Scraper's Friend"
     http://www.crummy.com/software/BeautifulSoup/
     Beautiful Soup parses a (possibly invalid) XML or HTML document into a
     tree representation. It provides methods and Pythonic idioms that make
     it easy to navigate, search, and modify the tree.
     A well-formed XML/HTML document yields a well-formed data
     structure. An ill-formed XML/HTML document yields a correspondingly
     ill-formed data structure. If your document is only locally
     well-formed, you can use this library to find and process the
     well-formed part of it.
     Beautiful Soup works with Python 2.2 and up. It has no external
     dependencies, but you'll have more success at converting data to UTF-8
     if you also install these three packages:
     * chardet, for auto-detecting character encodings
       http://chardet.feedparser.org/
     * cjkcodecs and iconv_codec, which add more encodings to the ones supported
       by stock Python.
       http://cjkpython.i18n.org/
     Beautiful Soup defines classes for two main parsing strategies:
      * BeautifulStoneSoup, for parsing XML, SGML, or your domain-specific
        language that kind of looks like XML.
      * BeautifulSoup, for parsing run-of-the-mill HTML code, be it valid
        or invalid. This class has web browser-like heuristics for
        obtaining a sensible parse tree in the face of common HTML errors.
     Beautiful Soup also defines a class (UnicodeDammit) for autodetecting
     the encoding of an HTML or XML document, and converting it to
     Unicode. Much of this code is taken from Mark Pilgrim's Universal Feed Parser.
     For more than you ever wanted to know about Beautiful Soup, see the
     documentation:
     http://www.crummy.com/software/BeautifulSoup/documentation.html
     Here, have some legalese:
     Copyright (c) 2004-2010, Leonard Richardson
     All rights reserved.
     Redistribution and use in source and binary forms, with or without
     modification, are permitted provided that the following conditions are
     met:
       * Redistributions of source code must retain the above copyright
         notice, this list of conditions and the following disclaimer.
       * Redistributions in binary form must reproduce the above
         copyright notice, this list of conditions and the following
         disclaimer in the documentation and/or other materials provided
         with the distribution.
       * Neither the name of the the Beautiful Soup Consortium and All
         Night Kosher Bakery nor the names of its contributors may be
         used to endorse or promote products derived from this software
         without specific prior written permission.
     THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
     "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
     LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
     A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
     CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
     EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
     PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
     PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
     LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
     NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
     SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE, DAMMIT.
     """
     from __future__ import generators
     __author__ = "Leonard Richardson (leonardr@segfault.org)"
     __version__ = "3.2.1"
     __copyright__ = "Copyright (c) 2004-2012 Leonard Richardson"
     __license__ = "New-style BSD"
     from sgmllib import SGMLParser, SGMLParseError
     import codecs
     import markupbase
     import types
     import re
     import sgmllib
     try:
       from htmlentitydefs import name2codepoint
     except ImportError:
       name2codepoint = {}
     try:
         set
     except NameError:
         from sets import Set as set
     # These hacks make Beautiful Soup able to parse XML with namespaces:
     # both replacement patterns accept ':' (as well as '-', '_' and '.')
     # after the first letter of a name.
     sgmllib.tagfind = re.compile('[a-zA-Z][-_.:a-zA-Z0-9]*')
     markupbase._declname_match = re.compile(r'[a-zA-Z][-_.:a-zA-Z0-9]*\s*').match
     # Encoding name used as the default `encoding` argument of the
     # __str__ methods defined in this module.
     DEFAULT_OUTPUT_ENCODING = "utf-8"
     def _match_css_class(str):
         """Build a RE to match the given CSS class."""
         return re.compile(r"(^|.*\s)%s($|\s)" % str)
     # First, the classes that represent markup elements.
     class PageElement(object):
         """Contains the navigational information for some part of the page
         (either a tag or a piece of text)"""
         def _invert(h):
             "Cheap function to invert a hash."
             i = {}
             for k,v in h.items():
                 i[v] = k
             return i
         XML_ENTITIES_TO_SPECIAL_CHARS = { "apos" : "'",
                                           "quot" : '"',
                                           "amp" : "&",
                                           "lt" : "<",
                                           "gt" : ">" }
         XML_SPECIAL_CHARS_TO_ENTITIES = _invert(XML_ENTITIES_TO_SPECIAL_CHARS)
         def setup(self, parent=None, previous=None):
             """Sets up the initial relations between this element and
             other elements."""
             self.parent = parent
             self.previous = previous
             self.next = None
             self.previousSibling = None
             self.nextSibling = None
             if self.parent and self.parent.contents:
                 self.previousSibling = self.parent.contents[-1]
                 self.previousSibling.nextSibling = self
         def replaceWith(self, replaceWith):
             oldParent = self.parent
             myIndex = self.parent.index(self)
             if hasattr(replaceWith, "parent")\
                       and replaceWith.parent is self.parent:
                 # We're replacing this element with one of its siblings.
                 index = replaceWith.parent.index(replaceWith)
                 if index and index < myIndex:
                     # Furthermore, it comes before this element. That
                     # means that when we extract it, the index of this
                     # element will change.
                     myIndex = myIndex - 1
             self.extract()
             oldParent.insert(myIndex, replaceWith)
         def replaceWithChildren(self):
             myParent = self.parent
             myIndex = self.parent.index(self)
             self.extract()
             reversedChildren = list(self.contents)
             reversedChildren.reverse()
             for child in reversedChildren:
                 myParent.insert(myIndex, child)
         def extract(self):
             """Destructively rips this element out of the tree.

             The element is removed from its parent's contents, the
             next/previous chain is re-linked around the element and
             everything beneath it, and the element's own parent and sibling
             links are cleared. Returns the element itself.
             """
             if self.parent:
                 try:
                     del self.parent.contents[self.parent.index(self)]
                 except ValueError:
                     # index() did not find this element among the parent's
                     # contents; there is nothing to delete.
                     pass
             #Find the two elements that would be next to each other if
             #this element (and any children) hadn't been parsed. Connect
             #the two.
             lastChild = self._lastRecursiveChild()
             nextElement = lastChild.next
             if self.previous:
                 self.previous.next = nextElement
             if nextElement:
                 nextElement.previous = self.previous
             # Cut the extracted subtree loose at both ends of the chain.
             self.previous = None
             lastChild.next = None
             self.parent = None
             # Join the former siblings to each other, then forget them.
             if self.previousSibling:
                 self.previousSibling.nextSibling = self.nextSibling
             if self.nextSibling:
                 self.nextSibling.previousSibling = self.previousSibling
             self.previousSibling = self.nextSibling = None
             return self
         def _lastRecursiveChild(self):
             "Finds the last element beneath this object to be parsed."
             lastChild = self
             while hasattr(lastChild, 'contents') and lastChild.contents:
                 lastChild = lastChild.contents[-1]
             return lastChild
         def insert(self, position, newChild):
             """Inserts `newChild` into this object's contents at `position`.

             A plain string is wrapped in a NavigableString first. `position`
             is clamped to the current number of children. A child that is
             already attached to a parent is extracted before being inserted.
             Besides updating `contents`, the parent, sibling and
             next/previous links of the new child and its neighbours are
             rewired.
             """
             if isinstance(newChild, basestring) \
                 and not isinstance(newChild, NavigableString):
                 newChild = NavigableString(newChild)
             position =  min(position, len(self.contents))
             if hasattr(newChild, 'parent') and newChild.parent is not None:
                 # We're 'inserting' an element that's already one
                 # of this object's children.
                 if newChild.parent is self:
                     index = self.index(newChild)
                     # NOTE(review): extracting a child that currently sits
                     # *before* `position` is what shifts the target index,
                     # so `index > position` looks inverted relative to the
                     # comment below. replaceWith compensates for the current
                     # behaviour, so confirm against it before changing this.
                     if index > position:
                         # Furthermore we're moving it further down the
                         # list of this object's children. That means that
                         # when we extract this element, our target index
                         # will jump down one.
                         position = position - 1
                 newChild.extract()
             newChild.parent = self
             previousChild = None
             if position == 0:
                 # First child: it directly follows this object in the
                 # next/previous chain.
                 newChild.previousSibling = None
                 newChild.previous = self
             else:
                 # Otherwise it follows the deepest last descendant of the
                 # child that precedes it.
                 previousChild = self.contents[position-1]
                 newChild.previousSibling = previousChild
                 newChild.previousSibling.nextSibling = newChild
                 newChild.previous = previousChild._lastRecursiveChild()
             if newChild.previous:
                 newChild.previous.next = newChild
             newChildsLastElement = newChild._lastRecursiveChild()
             if position >= len(self.contents):
                 # Appending at the end: the element after the new subtree is
                 # the next sibling of the nearest ancestor that has one.
                 newChild.nextSibling = None
                 parent = self
                 parentsNextSibling = None
                 while not parentsNextSibling:
                     parentsNextSibling = parent.nextSibling
                     parent = parent.parent
                     if not parent: # This is the last element in the document.
                         break
                 if parentsNextSibling:
                     newChildsLastElement.next = parentsNextSibling
                 else:
                     newChildsLastElement.next = None
             else:
                 # Inserting before an existing child: that child follows the
                 # new subtree.
                 nextChild = self.contents[position]
                 newChild.nextSibling = nextChild
                 if newChild.nextSibling:
                     newChild.nextSibling.previousSibling = newChild
                 newChildsLastElement.next = nextChild
             if newChildsLastElement.next:
                 newChildsLastElement.next.previous = newChildsLastElement
             self.contents.insert(position, newChild)
         def append(self, tag):
             """Appends the given tag to the contents of this tag."""
             self.insert(len(self.contents), tag)
         def findNext(self, name=None, attrs={}, text=None, **kwargs):
             """Returns the first item that matches the given criteria and
             appears after this Tag in the document."""
             return self._findOne(self.findAllNext, name, attrs, text, **kwargs)
         def findAllNext(self, name=None, attrs={}, text=None, limit=None,
                         **kwargs):
             """Returns all items that match the given criteria and appear
             after this Tag in the document."""
             return self._findAll(name, attrs, text, limit, self.nextGenerator,
                                  **kwargs)
         def findNextSibling(self, name=None, attrs={}, text=None, **kwargs):
             """Returns the closest sibling to this Tag that matches the
             given criteria and appears after this Tag in the document."""
             return self._findOne(self.findNextSiblings, name, attrs, text,
                                  **kwargs)
         def findNextSiblings(self, name=None, attrs={}, text=None, limit=None,
                              **kwargs):
             """Returns the siblings of this Tag that match the given
             criteria and appear after this Tag in the document."""
             return self._findAll(name, attrs, text, limit,
                                  self.nextSiblingGenerator, **kwargs)
         fetchNextSiblings = findNextSiblings # Compatibility with pre-3.x
         def findPrevious(self, name=None, attrs={}, text=None, **kwargs):
             """Returns the first item that matches the given criteria and
             appears before this Tag in the document."""
             return self._findOne(self.findAllPrevious, name, attrs, text, **kwargs)
         def findAllPrevious(self, name=None, attrs={}, text=None, limit=None,
                             **kwargs):
             """Returns all items that match the given criteria and appear
             before this Tag in the document."""
             return self._findAll(name, attrs, text, limit, self.previousGenerator,
                                **kwargs)
         fetchPrevious = findAllPrevious # Compatibility with pre-3.x
         def findPreviousSibling(self, name=None, attrs={}, text=None, **kwargs):
             """Returns the closest sibling to this Tag that matches the
             given criteria and appears before this Tag in the document."""
             return self._findOne(self.findPreviousSiblings, name, attrs, text,
                                  **kwargs)
         def findPreviousSiblings(self, name=None, attrs={}, text=None,
                                  limit=None, **kwargs):
             """Returns the siblings of this Tag that match the given
             criteria and appear before this Tag in the document."""
             return self._findAll(name, attrs, text, limit,
                                  self.previousSiblingGenerator, **kwargs)
         fetchPreviousSiblings = findPreviousSiblings # Compatibility with pre-3.x
         def findParent(self, name=None, attrs={}, **kwargs):
             """Returns the closest parent of this Tag that matches the given
             criteria."""
             # NOTE: We can't use _findOne because findParents takes a different
             # set of arguments.
             r = None
             l = self.findParents(name, attrs, 1)
             if l:
                 r = l[0]
             return r
         def findParents(self, name=None, attrs={}, limit=None, **kwargs):
             """Returns the parents of this Tag that match the given
             criteria."""
             return self._findAll(name, attrs, None, limit, self.parentGenerator,
                                  **kwargs)
         fetchParents = findParents # Compatibility with pre-3.x
         #These methods do the real heavy lifting.
         def _findOne(self, method, name, attrs, text, **kwargs):
             r = None
             l = method(name, attrs, text, 1, **kwargs)
             if l:
                 r = l[0]
             return r
         def _findAll(self, name, attrs, text, limit, generator, **kwargs):
             """Walks the elements produced by `generator()` and collects
             the ones that match the given criteria."""
             strainer = None
             if isinstance(name, SoupStrainer):
                 # The caller handed over a ready-made strainer.
                 strainer = name
             elif text is None and not limit and not attrs and not kwargs:
                 # (Possibly) special case some findAll*(...) searches.
                 if name is True:
                     # findAll*(True): every Tag.
                     return [candidate for candidate in generator()
                             if isinstance(candidate, Tag)]
                 if isinstance(name, basestring):
                     # findAll*('tag-name'): every Tag with exactly that name.
                     return [candidate for candidate in generator()
                             if isinstance(candidate, Tag)
                             and candidate.name == name]
             if strainer is None:
                 # Every remaining case goes through a freshly built strainer.
                 strainer = SoupStrainer(name, attrs, text, **kwargs)
             matches = ResultSet(strainer)
             for candidate in generator():
                 if not candidate:
                     # Skips falsy items, e.g. the None that ends a walk.
                     continue
                 hit = strainer.search(candidate)
                 if hit:
                     matches.append(hit)
                     if limit and len(matches) >= limit:
                         break
             return matches
         #These Generators can be used to navigate starting from both
         #NavigableStrings and Tags.
         def nextGenerator(self):
             i = self
             while i is not None:
                 i = i.next
                 yield i
         def nextSiblingGenerator(self):
             i = self
             while i is not None:
                 i = i.nextSibling
                 yield i
         def previousGenerator(self):
             i = self
             while i is not None:
                 i = i.previous
                 yield i
         def previousSiblingGenerator(self):
             i = self
             while i is not None:
                 i = i.previousSibling
                 yield i
         def parentGenerator(self):
             i = self
             while i is not None:
                 i = i.parent
                 yield i
         # Utility methods
         def substituteEncoding(self, str, encoding=None):
             """Returns `str` with each "%SOUP-ENCODING%" placeholder replaced
             by `encoding`, or by "utf-8" when no encoding is given."""
             if not encoding:
                 encoding = "utf-8"
             return str.replace("%SOUP-ENCODING%", encoding)
         def toEncoding(self, s, encoding=None):
             """Encodes an object to a string in some encoding, or to Unicode.
             ."""
             if isinstance(s, unicode):
                 if encoding:
                     s = s.encode(encoding)
             elif isinstance(s, str):
                 if encoding:
                     s = s.encode(encoding)
                 else:
                     s = unicode(s)
             else:
                 if encoding:
                     s  = self.toEncoding(str(s), encoding)
                 else:
                     s = unicode(s)
             return s
         BARE_AMPERSAND_OR_BRACKET = re.compile("([<>]|"
                                                + "&(?!#\d+;|#x[0-9a-fA-F]+;|\w+;)"
                                                + ")")
         def _sub_entity(self, x):
             """Used with a regular expression to substitute the
             appropriate XML entity for an XML special character."""
             return "&" + self.XML_SPECIAL_CHARS_TO_ENTITIES[x.group(0)[0]] + ";"
     class NavigableString(unicode, PageElement):
         """A unicode string that also carries PageElement's tree links."""
         def __new__(cls, value):
             """Create a new NavigableString.
             When unpickling a NavigableString, this method is called with
             the string in DEFAULT_OUTPUT_ENCODING. That encoding needs to be
             passed in to the superclass's __new__ or the superclass won't know
             how to handle non-ASCII characters.
             """
             if not isinstance(value, unicode):
                 return unicode.__new__(cls, value, DEFAULT_OUTPUT_ENCODING)
             return unicode.__new__(cls, value)
         def __getnewargs__(self):
             # The single constructor argument is the encoded form produced
             # by NavigableString.__str__.
             encoded = NavigableString.__str__(self)
             return (encoded,)
         def __getattr__(self, attr):
             """text.string gives you text. This is for backwards
             compatibility for Navigable*String, but for CData* it lets you
             get the string without the CData wrapper."""
             if attr != 'string':
                 raise AttributeError("'%s' object has no attribute '%s'" % (self.__class__.__name__, attr))
             return self
         def __unicode__(self):
             encoded = str(self)
             return encoded.decode(DEFAULT_OUTPUT_ENCODING)
         def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
             # Substitute outgoing XML entities.
             data = self.BARE_AMPERSAND_OR_BRACKET.sub(self._sub_entity, self)
             if not encoding:
                 return data
             return data.encode(encoding)
     class CData(NavigableString):
         """A NavigableString rendered inside a CDATA section."""
         def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
             """Return NavigableString's rendering wrapped in CDATA markers."""
             body = NavigableString.__str__(self, encoding)
             return "<![CDATA[%s]]>" % body
     class ProcessingInstruction(NavigableString):
         """A NavigableString rendered between ``<?`` and ``?>``."""
         def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
             """Return the instruction text, with any %SOUP-ENCODING%
             placeholder substituted, converted via toEncoding and wrapped
             in ``<?`` ... ``?>``."""
             text = self
             if "%SOUP-ENCODING%" in text:
                 text = self.substituteEncoding(text, encoding)
             encoded = self.toEncoding(text, encoding)
             return "<?%s?>" % encoded
     class Comment(NavigableString):
         """A NavigableString rendered as a markup comment."""
         def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
             """Return NavigableString's rendering wrapped in comment markers."""
             body = NavigableString.__str__(self, encoding)
             return "<!--%s-->" % body
     class Declaration(NavigableString):
         """A NavigableString rendered between ``<!`` and ``>``."""
         def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
             """Return NavigableString's rendering wrapped in ``<!`` ... ``>``."""
             body = NavigableString.__str__(self, encoding)
             return "<!%s>" % body
     class Tag(PageElement):
         """Represents a found HTML tag with its attributes and contents."""
         def _convertEntities(self, match):
             """Used in a call to re.sub to replace HTML, XML, and numeric
             entities with the appropriate Unicode characters. If HTML
             entities are being converted, any unrecognized entities are
             escaped."""
             x = match.group(1)
             if self.convertHTMLEntities and x in name2codepoint:
                 return unichr(name2codepoint[x])
             elif x in self.XML_ENTITIES_TO_SPECIAL_CHARS:
                 if self.convertXMLEntities:
                     return self.XML_ENTITIES_TO_SPECIAL_CHARS[x]
                 else:
                     return u'&%s;' % x
             elif len(x) > 0 and x[0] == '#':
                 # Handle numeric entities
                 if len(x) > 1 and x[1] == 'x':
                     return unichr(int(x[2:], 16))
                 else:
                     return unichr(int(x[1:]))
             elif self.escapeUnrecognizedEntities:
                 return u'&amp;%s;' % x
             else:
                 return u'&%s;' % x
         def __init__(self, parser, name, attrs=None, parent=None,
                      previous=None):
             """Basic constructor.
             ``attrs`` may be None, a dict, or a sequence of (key, value)
             pairs; it is stored as a list of pairs whose values have had
             their entities converted according to the parser's settings."""
             # Only the parser's class is kept, not the parser object: that
             # lets extracted chunks be garbage-collected.
             self.parserClass = parser.__class__
             self.isSelfClosing = parser.isSelfClosingTag(name)
             self.name = name
             if attrs is None:
                 attrs = []
             elif isinstance(attrs, dict):
                 attrs = attrs.items()
             self.attrs = attrs
             self.contents = []
             self.setup(parent, previous)
             self.hidden = False
             self.containsSubstitutions = False
             # Entity-handling switches are copied from the parser.
             self.convertHTMLEntities = parser.convertHTMLEntities
             self.convertXMLEntities = parser.convertXMLEntities
             self.escapeUnrecognizedEntities = parser.escapeUnrecognizedEntities
             # Convert any HTML, XML, or numeric entities in the attribute values.
             entityPattern = "&(#\d+|#x[0-9a-fA-F]+|\w+);"
             self.attrs = [(attrName,
                            re.sub(entityPattern, self._convertEntities, attrValue))
                           for attrName, attrValue in self.attrs]
         def getString(self):
             """Return the tag's only child when that child is a
             NavigableString; otherwise return None."""
             if len(self.contents) != 1:
                 return None
             onlyChild = self.contents[0]
             if isinstance(onlyChild, NavigableString):
                 return onlyChild
             return None
         def setString(self, string):
             """Replace the contents of the tag with a string.
             All current children are removed with clear() and ``string``
             is then appended as the only child."""
             self.clear()
             self.append(string)
         # tag.string reads through getString and assigns through setString.
         string = property(getString, setString)
         def getText(self, separator=u""):
             """Return the stripped text of every NavigableString below this
             tag, joined with ``separator``. A tag without contents yields
             an empty Unicode string."""
             if not len(self.contents):
                 return u""
             # Walk the ``next`` chain from the first child until the node
             # that follows the last recursive child is reached.
             stopNode = self._lastRecursiveChild().next
             node = self.contents[0]
             pieces = []
             while node is not stopNode:
                 if isinstance(node, NavigableString):
                     pieces.append(node.strip())
                 node = node.next
             return separator.join(pieces)
         text = property(getText)
         def get(self, key, default=None):
             """Returns the value of the 'key' attribute for the tag, or
             the value given for 'default' if it doesn't have that
             attribute."""
             return self._getAttrMap().get(key, default)
         def clear(self):
             """Extract all children."""
             for child in self.contents[:]:
                 child.extract()
         def index(self, element):
             for i, child in enumerate(self.contents):
                 if child is element:
                     return i
             raise ValueError("Tag.index: element not in tag")
         def has_key(self, key):
             return self._getAttrMap().has_key(key)
         def __getitem__(self, key):
             """tag[key] returns the value of the 'key' attribute for the tag,
             and throws an exception if it's not there."""
             return self._getAttrMap()[key]
         def __iter__(self):
             """Iterating over a tag iterates over its contents, i.e. the
             ``self.contents`` list, in order."""
             return iter(self.contents)
         def __len__(self):
             """The length of a tag is the length of its list of contents
             (``self.contents``)."""
             return len(self.contents)
         def __contains__(self, x):
             """``x in tag`` is a membership test on ``self.contents``."""
             return x in self.contents
         def __nonzero__(self):
             """A tag is non-None even if it has no contents.
             Always returns True, so truth-testing a tag does not fall
             back to __len__."""
             return True
         def __setitem__(self, key, value):
             """Setting tag[key] sets the value of the 'key' attribute for the
             tag."""
             self._getAttrMap()
             self.attrMap[key] = value
             found = False
             for i in range(0, len(self.attrs)):
                 if self.attrs[i][0] == key:
                     self.attrs[i] = (key, value)
                     found = True
             if not found:
                 self.attrs.append((key, value))
             self._getAttrMap()[key] = value
         def __delitem__(self, key):
             "Deleting tag[key] deletes all 'key' attributes for the tag."
             for item in self.attrs:
                 if item[0] == key:
                     self.attrs.remove(item)
                     #We don't break because bad HTML can define the same
                     #attribute multiple times.
                 self._getAttrMap()
                 if self.attrMap.has_key(key):
                     del self.attrMap[key]
         def __call__(self, *args, **kwargs):
             """Calling a tag like a function is the same as calling its
             findAll() method. Eg. tag('a') returns a list of all the A tags
             found within this tag."""
             return apply(self.findAll, args, kwargs)
         def __getattr__(self, tag):
             #print "Getattr %s.%s" % (self.__class__, tag)
             if len(tag) > 3 and tag.rfind('Tag') == len(tag)-3:
                 return self.find(tag[:-3])
             elif tag.find('__') != 0:
                 return self.find(tag)
             raise AttributeError, "'%s' object has no attribute '%s'" % (self.__class__, tag)
         def __eq__(self, other):
             """Returns true iff this tag has the same name, the same attributes,
             and the same contents (recursively) as the given tag.
             NOTE: right now this will return false if two tags have the
             same attributes in a different order. Should this be fixed?"""
             if other is self:
                 return True
             if not hasattr(other, 'name') or not hasattr(other, 'attrs') or not hasattr(other, 'contents') or self.name != other.name or self.attrs != other.attrs or len(self) != len(other):
                 return False
             for i in range(0, len(self.contents)):
                 if self.contents[i] != other.contents[i]:
                     return False
             return True
         def __ne__(self, other):
             """Returns true iff this tag is not identical to the other tag,
             as defined in __eq__ (the result of ``==`` is simply negated)."""
             return not self == other
         def __repr__(self, encoding=DEFAULT_OUTPUT_ENCODING):
             """Renders this tag as a string by delegating to __str__ with
             the given encoding."""
             return self.__str__(encoding)
         def __unicode__(self):
             """Render this tag through __str__ with encoding None, which
             asks for Unicode output instead of an encoded string."""
             return self.__str__(None)
         def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING,
                     prettyPrint=False, indentLevel=0):
             """Returns a string or Unicode representation of this tag and
             its contents. To get Unicode, pass None for encoding.
             NOTE: since Python's HTML parser consumes whitespace, this
             method is not certain to reproduce the whitespace present in
             the original string."""
             encodedName = self.toEncoding(self.name, encoding)
             attrs = []
             if self.attrs:
                 for key, val in self.attrs:
                     fmt = '%s="%s"'
                     if isinstance(val, basestring):
                         if self.containsSubstitutions and '%SOUP-ENCODING%' in val:
                             val = self.substituteEncoding(val, encoding)
                         # The attribute value either:
+                        #
                         # * Contains no embedded double quotes or single quotes.
                         #   No problem: we enclose it in double quotes.
                         # * Contains embedded single quotes. No problem:
                         #   double quotes work here too.
                         # * Contains embedded double quotes. No problem:
                         #   we enclose it in single quotes.
                         # * Embeds both single _and_ double quotes. This
                         #   can't happen naturally, but it can happen if
                         #   you modify an attribute value after parsing
                         #   the document. Now we have a bit of a
                         #   problem. We solve it by enclosing the
                         #   attribute in single quotes, and escaping any
                         #   embedded single quotes to XML entities.
                         if '"' in val:
                             fmt = "%s='%s'"
                             if "'" in val:
                                 # TODO: replace with apos when
                                 # appropriate.
                                 val = val.replace("'", "&squot;")
                         # Now we're okay w/r/t quotes. But the attribute
                         # value might also contain angle brackets, or
                         # ampersands that aren't part of entities. We need
                         # to escape those to XML entities too.
                         val = self.BARE_AMPERSAND_OR_BRACKET.sub(self._sub_entity, val)
                     attrs.append(fmt % (self.toEncoding(key, encoding),
                                         self.toEncoding(val, encoding)))
             close = ''
             closeTag = ''
             if self.isSelfClosing:
                 close = ' /'
             else:
                 closeTag = '</%s>' % encodedName
             indentTag, indentContents = 0, 0
             if prettyPrint:
                 indentTag = indentLevel
                 space = (' ' * (indentTag-1))
                 indentContents = indentTag + 1
             contents = self.renderContents(encoding, prettyPrint, indentContents)
             if self.hidden:
                 s = contents
             else:
                 s = []
                 attributeString = ''
                 if attrs:
                     attributeString = ' ' + ' '.join(attrs)
                 if prettyPrint:
                     s.append(space)
                 s.append('<%s%s%s>' % (encodedName, attributeString, close))
                 if prettyPrint:
                     s.append("\n")
                 s.append(contents)
                 if prettyPrint and contents and contents[-1] != "\n":
                     s.append("\n")
                 if prettyPrint and closeTag:
                     s.append(space)
                 s.append(closeTag)
                 if prettyPrint and closeTag and self.nextSibling:
                     s.append("\n")
                 s = ''.join(s)
             return s
         def decompose(self):
             """Recursively destroys the contents of this tree.
             The tag is extracted first; then every node reachable through
             the ``next`` chain from the first child has its links reset to
             None, and every Tag among them has its contents list emptied."""
             self.extract()
             if len(self.contents) == 0:
                 return
             node = self.contents[0]
             while node is not None:
                 # Remember the successor before the links are cleared.
                 following = node.next
                 if isinstance(node, Tag):
                     del node.contents[:]
                 node.parent = None
                 node.previous = None
                 node.previousSibling = None
                 node.next = None
                 node.nextSibling = None
                 node = following
         def prettify(self, encoding=DEFAULT_OUTPUT_ENCODING):
             """Render this tag through __str__ with pretty-printing
             switched on, using the given encoding."""
             return self.__str__(encoding, True)
         def renderContents(self, encoding=DEFAULT_OUTPUT_ENCODING,
                            prettyPrint=False, indentLevel=0):
             """Renders the contents of this tag as a string in the given
             encoding. If encoding is None, returns a Unicode string.."""
             s=[]
             for c in self:
                 text = None
                 if isinstance(c, NavigableString):
                     text = c.__str__(encoding)
                 elif isinstance(c, Tag):
                     s.append(c.__str__(encoding, prettyPrint, indentLevel))
                 if text and prettyPrint:
                     text = text.strip()
                 if text:
                     if prettyPrint:
                         s.append(" " * (indentLevel-1))
                     s.append(text)
                     if prettyPrint:
                         s.append("\n")
             return ''.join(s)
         #Soup methods
         def find(self, name=None, attrs={}, recursive=True, text=None,
                  **kwargs):
             """Return only the first child of this Tag matching the given
             criteria."""
             r = None
             l = self.findAll(name, attrs, recursive, text, 1, **kwargs)
             if l:
                 r = l[0]
             return r
         findChild = find
         def findAll(self, name=None, attrs={}, recursive=True, text=None,
                     limit=None, **kwargs):
             """Extracts a list of Tag objects that match the given
             criteria.  You can specify the name of the Tag and any
             attributes you want the Tag to have.
             The value of a key-value pair in the 'attrs' map can be a
             string, a list of strings, a regular expression object, or a
             callable that takes a string and returns whether or not the
             string matches for some custom definition of 'matches'. The
             same is true of the tag name."""
             generator = self.recursiveChildGenerator
             if not recursive:
                 generator = self.childGenerator
             return self._findAll(name, attrs, text, limit, generator, **kwargs)
         findChildren = findAll
         # Pre-3.x compatibility methods: the old names are plain aliases
         # of find() and findAll().
         first = find
         fetch = findAll
         def fetchText(self, text=None, recursive=True, limit=None):
             """Call findAll() with only the text, recursive and limit
             criteria."""
             return self.findAll(text=text, recursive=recursive, limit=limit)
         def firstText(self, text=None, recursive=True):
             """Call find() with only the text and recursive criteria."""
             return self.find(text=text, recursive=recursive)
         #Private methods
         def _getAttrMap(self):
             """Initializes a map representation of this tag's attributes,
             if not already initialized."""
             if not getattr(self, 'attrMap'):
                 self.attrMap = {}
                 for (key, value) in self.attrs:
                     self.attrMap[key] = value
             return self.attrMap
         #Generator methods
         def childGenerator(self):
             """Return an iterator over this tag's direct children."""
             # Just use the iterator from the contents
             return iter(self.contents)
         def recursiveChildGenerator(self):
             if not len(self.contents):
                 raise StopIteration
             stopNode = self._lastRecursiveChild().next
             current = self.contents[0]
             while current is not stopNode:
                 yield current
                 current = current.next
     # Next, a couple classes to represent queries and their results.
     class SoupStrainer:
         """Encapsulates a number of ways of matching a markup element (tag or
         text)."""
         def __init__(self, name=None, attrs={}, text=None, **kwargs):
             self.name = name
             if isinstance(attrs, basestring):
                 kwargs['class'] = _match_css_class(attrs)
                 attrs = None
             if kwargs:
                 if attrs:
                     attrs = attrs.copy()
                     attrs.update(kwargs)
                 else:
                     attrs = kwargs
             self.attrs = attrs
             self.text = text
         def __str__(self):
             if self.text:
                 return self.text
             else:
                 return "%s|%s" % (self.name, self.attrs)
         def searchTag(self, markupName=None, markupAttrs={}):
             """Check a tag against this strainer's name and attribute
             criteria.
             ``markupName`` is either a Tag object or a tag name; in the
             latter case ``markupAttrs`` supplies the attributes, as a
             mapping or as a sequence of (key, value) pairs. Returns the
             Tag (or the name that was passed in) when it matches, and None
             otherwise."""
             found = None
             markup = None
             if isinstance(markupName, Tag):
                 # A Tag serves as its own attribute source.
                 markup = markupName
                 markupAttrs = markup
             # A callable name criterion is called with the raw name and
             # attributes, but only when no Tag object was supplied.
             callFunctionWithTagData = callable(self.name) \
                                     and not isinstance(markupName, Tag)
             if (not self.name) \
                    or callFunctionWithTagData \
                    or (markup and self._matches(markup, self.name)) \
                    or (not markup and self._matches(markupName, self.name)):
                 if callFunctionWithTagData:
                     match = self.name(markupName, markupAttrs)
                 else:
                     match = True
                     markupAttrMap = None
                     for attr, matchAgainst in self.attrs.items():
                         if not markupAttrMap:
                              # Use the attributes directly when they offer
                              # get(); otherwise build a dict from the pairs.
                              if hasattr(markupAttrs, 'get'):
                                 markupAttrMap = markupAttrs
                              else:
                                 markupAttrMap = {}
                                 for k,v in markupAttrs:
                                     markupAttrMap[k] = v
                         attrValue = markupAttrMap.get(attr)
                         # Every attribute criterion has to match.
                         if not self._matches(attrValue, matchAgainst):
                             match = False
                             break
                 if match:
                     if markup:
                         found = markup
                     else:
                         found = markupName
             return found
         def search(self, markup):
             """Match ``markup`` against this strainer and return the
             matching element, or None.
             ``markup`` may be an iterable of elements, a Tag, or a string;
             anything else raises an Exception."""
             #print 'looking for %s in %s' % (self, markup)
             # If given a list of items, scan it for a text element that
             # matches.
             if hasattr(markup, "__iter__") and not isinstance(markup, Tag):
                 for element in markup:
                     if isinstance(element, NavigableString) \
                            and self.search(element):
                         return element
                 return None
             # If it's a Tag, make sure its name or attributes match.
             # Don't bother with Tags if we're searching for text.
             if isinstance(markup, Tag):
                 if not self.text:
                     return self.searchTag(markup)
                 return None
             # If it's text, make sure the text matches.
             if isinstance(markup, NavigableString) or \
                    isinstance(markup, basestring):
                 if self._matches(markup, self.text):
                     return markup
                 return None
             raise Exception("I don't know how to match against a %s"
                             % markup.__class__)
         def _matches(self, markup, matchAgainst):
             """Decide whether ``markup`` satisfies the single criterion
             ``matchAgainst``.
             ``matchAgainst`` may be True (anything that is not None
             matches), a callable (its return value is the result), an
             object with a ``match`` attribute (treated as a regular
             expression and applied with search()), an iterable (membership
             test), or any other value, which is compared for equality
             after being converted to the same string type as ``markup``."""
             #print "Matching %s against %s" % (markup, matchAgainst)
             result = False
             if matchAgainst is True:
                 result = markup is not None
             elif callable(matchAgainst):
                 result = matchAgainst(markup)
             else:
                 #Custom match methods take the tag as an argument, but all
                 #other ways of matching match the tag name as a string.
                 if isinstance(markup, Tag):
                     markup = markup.name
                 if markup and not isinstance(markup, basestring):
                     markup = unicode(markup)
                 #Now we know that chunk is either a string, or None.
                 if hasattr(matchAgainst, 'match'):
                     # It's a regexp object.
                     result = markup and matchAgainst.search(markup)
                 elif hasattr(matchAgainst, '__iter__'): # list-like
                     result = markup in matchAgainst
                 elif hasattr(matchAgainst, 'items'):
                     # NOTE(review): a dict also has __iter__, so it is
                     # handled by the branch above; confirm which inputs,
                     # if any, are expected to reach this one.
                     result = markup.has_key(matchAgainst)
                 elif matchAgainst and isinstance(markup, basestring):
                     # Bring the criterion to the same string type as the
                     # markup for the equality test below.
                     if isinstance(markup, unicode):
                         matchAgainst = unicode(matchAgainst)
                     else:
                         matchAgainst = str(matchAgainst)
                 # Fall back to plain equality when nothing matched so far.
                 if not result:
                     result = matchAgainst == markup
             return result
     class ResultSet(list):
         """A ResultSet is just a list that keeps track of the SoupStrainer
         that created it."""
         def __init__(self, source):
             """Create an empty result list and remember ``source``, the
             object that produced it."""
             # Initialise this instance. The previous call,
             # list.__init__([]), initialised a throwaway list instead.
             list.__init__(self)
             self.source = source
     # Now, some helper functions.
     def buildTagMap(default, *args):
         """Turns a list of maps, lists, or scalars into a single map.
         Maps are merged as they are; each item of a list, and each scalar,
         is mapped to ``default``. Later arguments override earlier ones.
         Used to build the SELF_CLOSING_TAGS, NESTABLE_TAGS, and
         NESTING_RESET_TAGS maps out of lists and partial maps."""
         tagMap = {}
         for part in args:
             if hasattr(part, 'items'):
                 # A map: merge its pairs.
                 tagMap.update(part.items())
             elif hasattr(part, '__iter__'):
                 # A list: every item gets the default value.
                 tagMap.update(dict.fromkeys(part, default))
             else:
                 # A scalar: it gets the default value.
                 tagMap[part] = default
         return tagMap
     # Now, the parser classes.
     class BeautifulStoneSoup(Tag, SGMLParser):
         """This class contains the basic parser and search code. It defines
         a parser that knows nothing about tag behavior except for the
         following:
           You can't close a tag without closing all the tags it encloses.
           That is, "<foo><bar></foo>" actually means
           "<foo><bar></bar></foo>".
         [Another possible explanation is "<foo><bar /></foo>", but since
         this class defines no SELF_CLOSING_TAGS, it will never use that
         explanation.]
         This class is useful for parsing XML or made-up markup languages,
         or when BeautifulSoup makes an assumption counter to what you were
         expecting."""
         SELF_CLOSING_TAGS = {}
         NESTABLE_TAGS = {}
         RESET_NESTING_TAGS = {}
         QUOTE_TAGS = {}
         PRESERVE_WHITESPACE_TAGS = []
         MARKUP_MASSAGE = [(re.compile('(<[^<>]*)/>'),
                            lambda x: x.group(1) + ' />'),
                           (re.compile('<!\s+([^<>]*)>'),
                            lambda x: '<!' + x.group(1) + '>')
+                          ]
         ROOT_TAG_NAME = u'[document]'
         HTML_ENTITIES = "html"
         XML_ENTITIES = "xml"
         XHTML_ENTITIES = "xhtml"
         # TODO: This only exists for backwards-compatibility
         ALL_ENTITIES = XHTML_ENTITIES
         # Used when determining whether a text node is all whitespace and
         # can be replaced with a single space. A text node that contains
         # fancy Unicode spaces (usually non-breaking) should be left
         # alone.
         STRIP_ASCII_SPACES = { 9: None, 10: None, 12: None, 13: None, 32: None, }

... This diff was truncated because it exceeds the maximum size that can be displayed.

Also available in: Unified diff

Application: gvSIG desktop » gvSIG scripting

Revision 548