git.fiddlerwoaroof.com
ts-sexp.py
286e4ed1
 # Copyright (c) 2019 Edward Langley
 # All rights reserved.
 #
 # Redistribution and use in source and binary forms, with or without
 # modification, are permitted provided that the following conditions
 # are met:
 #
 # Redistributions of source code must retain the above copyright notice,
 # this list of conditions and the following disclaimer.
 #
 # Redistributions in binary form must reproduce the above copyright
 # notice, this list of conditions and the following disclaimer in the
 # documentation and/or other materials provided with the distribution.
 #
 # Neither the name of the project's author nor the names of its
 # contributors may be used to endorse or promote products derived from
 # this software without specific prior written permission.
 #
 # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 # "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 # LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
 # FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 # HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 # SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
 # TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
 # PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
 # LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
 # NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
 # SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 
 import tree_sitter as t
 
 # Compile the grammar checkouts listed below into one shared library, 'ts.so'.
 # The entries are relative paths, so they are presumably resolved against the
 # current working directory -- confirm before running from elsewhere.
 t.Language.build_library(
     'ts.so',
     [
         'tree-sitter-javascript',
         'tree-sitter-scala',
         'tree-sitter-java',
         'tree-sitter-kotlin',
     ],
 )
 
 def listify(text, cursor, level=1):
     """Convert the subtree under ``cursor`` into nested lists, tracing as it goes.

     The returned list starts with the node's type.  The second element is
     either the list built for the node's first child or, when the node has
     no children, the node's own source text (``text`` sliced by the node's
     byte offsets and decoded as UTF-8).

     The recursive call for a node also walks the cursor on to that node's
     next sibling, so a following sibling ends up appended to the list of the
     sibling before it instead of to the parent's list.

     Args:
         text: The parsed source as bytes; sliced with node byte offsets.
         cursor: A tree cursor providing ``node``, ``goto_first_child()``,
             ``goto_next_sibling()`` and ``goto_parent()``.  It is moved
             during the walk.
         level: Indentation depth used for the trace lines printed on entry
             ('>') and exit ('<') of each node.

     Returns:
         The nested list described above.
     """
     current = cursor.node
     deeper = level + 1

     def trace(marker):
         # Same line layout on entry and exit; only the marker differs.
         print('  '*level, marker, current.type, current.start_byte, current.end_byte)

     trace('>')

     if cursor.goto_first_child():
         payload = listify(text, cursor, deeper)
         # The recursion leaves the cursor on some child; climb back up.
         cursor.goto_parent()
     else:
         payload = text[current.start_byte:current.end_byte].decode('utf-8')

     sexp = [current.type, payload]

     # Siblings are traced one level deeper too, mirroring the child case.
     while cursor.goto_next_sibling():
         sexp.append(listify(text, cursor, deeper))

     trace('<')

     return sexp
 
 
 
 # Load the 'java' grammar from the 'ts.so' library and attach it to a parser.
 java = t.Language('ts.so', 'java')
 parser = t.Parser(java)
 parser.set_language(java)

 # Read the source as raw bytes: listify() slices its `text` argument by node
 # byte offsets and decodes it, so this is presumably what gets passed to it.
 # The context manager closes the file handle, which the previous bare
 # open(...).read() left to the garbage collector.
 with open('/java/file.java', 'rb') as source_file:
     text = source_file.read()