# git.fiddlerwoaroof.com
# Raw Blame History
# Copyright (c) 2019 Edward Langley
# All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions
# are met:
#
# Redistributions of source code must retain the above copyright notice,
# this list of conditions and the following disclaimer.
#
# Redistributions in binary form must reproduce the above copyright
# notice, this list of conditions and the following disclaimer in the
# documentation and/or other materials provided with the distribution.
#
# Neither the name of the project's author nor the names of its
# contributors may be used to endorse or promote products derived from
# this software without specific prior written permission.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
# FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
# HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
# SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
# TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
# PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
# LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
# NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
# SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

import tree_sitter as t

# Build the grammar library 'ts.so' from the grammar directories listed
# below.  The directory names are relative paths, so presumably they are
# resolved against the current working directory -- TODO confirm.
# This call sits at module top level, so it runs every time this file is
# executed or imported.
t.Language.build_library('ts.so', [
    'tree-sitter-javascript',
    'tree-sitter-scala',
    'tree-sitter-java',
    'tree-sitter-kotlin'
])

def listify(text, cursor, level=1):
    """Convert the subtree under *cursor* into nested Python lists.

    A trace line is printed when a node is entered ('>') and when it is
    left ('<'); each shows the node type and its byte offsets, indented
    by two spaces per *level*.

    Args:
        text: Byte buffer the nodes index into.  It is sliced with the
            node's ``start_byte``/``end_byte`` and the slice is decoded
            as UTF-8.
        cursor: Object exposing ``node``, ``goto_first_child()``,
            ``goto_parent()`` and ``goto_next_sibling()``.  It is moved
            in place while walking.
        level: Indentation depth used for the trace output.

    Returns:
        A list ``[node_type, payload, *following]``.  ``payload`` is the
        list built for the first child or, for a node without children,
        the decoded source text of the node.  ``following`` holds one
        list per sibling the cursor could still advance to afterwards.

    Note:
        Every following sibling is processed by a recursive call that
        performs its own sibling walk, so siblings end up nested inside
        the list of the sibling before them instead of next to it, and
        the trace indentation grows by one level per sibling.  On return
        the cursor stays on the last sibling it reached.
    """
    current = cursor.node
    kind, start, end = current.type, current.start_byte, current.end_byte
    indent = '  ' * level

    print(indent, '>', kind, start, end)

    if cursor.goto_first_child():
        # Descend, then climb back so the sibling walk starts from this node.
        payload = listify(text, cursor, level + 1)
        cursor.goto_parent()
    else:
        # Childless node: keep its source text.
        payload = text[start:end].decode('utf-8')

    tree = [kind, payload]
    while cursor.goto_next_sibling():
        tree.append(listify(text, cursor, level + 1))

    print(indent, '<', kind, start, end)

    return tree



# Load the 'java' language from the 'ts.so' library and attach it to a
# parser.
# NOTE(review): the language is handed to the parser twice (constructor
# argument and set_language) -- presumably one of the two is redundant for
# the tree_sitter version in use; confirm before removing either.
java = t.Language('ts.so', 'java')
parser = t.Parser(java)
parser.set_language(java)

# Read the input file as raw bytes.  The context manager closes the file
# handle as soon as the contents are in memory instead of leaving that to
# garbage collection.
with open('/java/file.java', 'rb') as source_file:
    text = source_file.read()