UnrealEngineSDK-Demo/_dlg_twine_to_json_human_text_8py_source.html

#!/usr/bin/env python3

# Copyright 2017-2018 Csaba Molnar, Daniel Butum


import os

import sys

import argparse

import json

import uuid

import re

from pprint import pprint


from html.parser import HTMLParser

from html.entities import name2codepoint


# NOTE: This script is standalone and does not depend on any third-party libraries


# Suffix appended to the source file's base name to build the exported json file path.
DLG_JSON_HUMAN_EXTENSION = ".dlg_human.json"

# Lowest accepted index: nodes and edge targets with a smaller index are discarded on export.
ROOT_NODE_INDEX = -1


class Colors:
    """
    Terminal escape sequences used to colorize the console output.

    Every *_LIGHT entry is the same color code as its base entry, with the
    leading `1;` attribute instead of `0;`.
    """

    HEADER = '\033[95m'

    BLUE = '\033[0;36m'
    BLUE_LIGHT = '\033[1;36m'

    GREEN = '\033[0;32m'
    GREEN_LIGHT = '\033[1;32m'

    YELLOW = '\033[0;33m'
    YELLOW_LIGHT = '\033[1;33m'

    RED = '\033[0;31m'
    RED_LIGHT = '\033[1;31m'

    # No Color: appended after a colored string to restore the default
    END = '\033[0m'


def print_newlines(nr=1):
    """Write `nr` newline characters to stdout; nothing is written unless `nr` is positive."""
    if not nr > 0:
        return

    print('\n' * nr, end='')


def print_reset_color():
    """Print the color reset sequence, but only when stdout is attached to a terminal."""
    if not sys.stdout.isatty():
        # Piped or redirected output never received color codes, nothing to reset
        return

    print(Colors.END)


def _print_internal(color, string, **kwargs):
    """
    Print `string`, wrapped in `color` and the reset sequence when stdout is a terminal.

    When stdout is piped or redirected the string is printed without any
    escape sequence. Extra keyword arguments are forwarded to print().
    """
    running_in_terminal = sys.stdout.isatty()
    prefix = color if running_in_terminal else ''
    suffix = Colors.END if running_in_terminal else ''

    print(prefix + string + suffix, **kwargs)


def print_red(*args, **kwargs):
    """Print the arguments, converted to strings and joined by spaces, using Colors.RED."""
    message = " ".join(str(arg) for arg in args)
    _print_internal(Colors.RED, message, **kwargs)


def print_red_light(*args, **kwargs):
    """Print the arguments, converted to strings and joined by spaces, using Colors.RED_LIGHT."""
    message = " ".join(str(arg) for arg in args)
    _print_internal(Colors.RED_LIGHT, message, **kwargs)


def print_blue(*args, **kwargs):
    """Print the arguments, converted to strings and joined by spaces, using Colors.BLUE."""
    message = " ".join(str(arg) for arg in args)
    _print_internal(Colors.BLUE, message, **kwargs)


def print_blue_light(*args, **kwargs):
    """Print the arguments, converted to strings and joined by spaces, using Colors.BLUE_LIGHT."""
    message = " ".join(str(arg) for arg in args)
    _print_internal(Colors.BLUE_LIGHT, message, **kwargs)


def print_yellow(*args, **kwargs):
    """Print the arguments, converted to strings and joined by spaces, using Colors.YELLOW."""
    message = " ".join(str(arg) for arg in args)
    _print_internal(Colors.YELLOW, message, **kwargs)


def print_yellow_light(*args, **kwargs):
    """Print the arguments, converted to strings and joined by spaces, using Colors.YELLOW_LIGHT."""
    message = " ".join(str(arg) for arg in args)
    _print_internal(Colors.YELLOW_LIGHT, message, **kwargs)


def print_green(*args, **kwargs):
    """Print the arguments, converted to strings and joined by spaces, using Colors.GREEN."""
    message = " ".join(str(arg) for arg in args)
    _print_internal(Colors.GREEN, message, **kwargs)


def print_green_light(*args, **kwargs):
    """Print the arguments, converted to strings and joined by spaces, using Colors.GREEN_LIGHT."""
    message = " ".join(str(arg) for arg in args)
    _print_internal(Colors.GREEN_LIGHT, message, **kwargs)


def print_config_value(config_name, config_value):
    """Print a `<name> = <value>` line: the label through print_blue, the value through print_blue_light."""
    label = "{} = ".format(config_name)
    # Keep the value on the same line as the label
    print_blue(label, end='')
    print_blue_light(config_value)


def string_to_int(string):
    """Convert `string` with int(); return None instead of raising when int() reports a ValueError."""
    try:
        parsed = int(string)
    except ValueError:
        parsed = None

    return parsed


class TwineNodeTag:
    """Names of the Twine passage tags this script recognizes, plus helpers to validate tags."""

    NODE_START = "node-start"
    NODE_END = "node-end"
    NODE_VIRTUAL_PARENT = "node-virtual-parent"
    NODE_SPEECH = "node-speech"
    NODE_SPEECH_SEQUENCE = "node-speech-sequence"
    NODE_SELECTOR_FIRST = "node-selector-first"
    NODE_SELECTOR_RANDOM = "node-selector-random"

    @classmethod
    def get_all_tags(cls):
        """Return a new set containing every recognized tag name."""
        return {
            cls.NODE_START,
            cls.NODE_END,
            cls.NODE_VIRTUAL_PARENT,
            cls.NODE_SPEECH,
            cls.NODE_SPEECH_SEQUENCE,
            cls.NODE_SELECTOR_FIRST,
            cls.NODE_SELECTOR_RANDOM,
        }

    @classmethod
    def is_valid_tag(cls, tag):
        """Return True if `tag`, compared case-insensitively, is a recognized tag name."""
        return tag.lower() in cls.get_all_tags()

    @classmethod
    def has_valid_tags(cls, tags_list):
        """Return True if at least one entry of `tags_list` is a recognized tag (case-insensitive)."""
        tags_set = {x.lower() for x in tags_list}
        return not cls.get_all_tags().isdisjoint(tags_set)


class TwineHelper:
    """Shared parsing helpers for Twine node names and text."""

    # `<node index>. <Speaker>`: an optionally negative integer, a dot,
    # optional whitespace and then the rest of the line
    REGEX_NAME = r"(-?\d+)\.\s*(.*)"

    @classmethod
    def parse_twine_node_name(cls, raw_name, context_multiple_matches, context_invalid_index, context_invalid_speaker):
        """
        Extract the node index and the speaker from a `<node index>. <Speaker>` name.

        raw_name                 -- the name to parse
        context_multiple_matches -- prefix of the warning printed when the name matches more than once
        context_invalid_index    -- prefix of the warning printed when the index group is missing
        context_invalid_speaker  -- prefix of the warning printed when the speaker group is missing

        Returns a (node_index, speaker) tuple. Both are None when the name does
        not match; node_index is None when the index can't be converted to an int.
        Only the first match is used.
        """
        # Get node index and speaker
        matches_name = re.finditer(cls.REGEX_NAME, raw_name, re.MULTILINE | re.UNICODE)
        node_index, speaker = None, None
        for index, match in enumerate(matches_name):
            if index > 0:
                print_yellow("{}, got multiple name matches".format(context_multiple_matches))
                break

            group_index = match.group(1)
            if group_index is not None:
                node_index = string_to_int(group_index.strip())
            else:
                print_yellow("{}, could not get node index from <node index>. <Speaker>".format(context_invalid_index))

            # The speaker must be validated on its own group, not on the index group
            group_speaker = match.group(2)
            if group_speaker is not None:
                speaker = group_speaker.strip()
            else:
                print_yellow("{}, could not get speaker from <node index>. <Speaker>".format(context_invalid_speaker))

        return node_index, speaker

    @classmethod
    def clean_text(cls, text):
        """Strip surrounding whitespace from `text` and convert every `\\n` into `\\r\\n`."""
        # Use windows line endings
        return text.strip().replace("\n", "\r\n")


class TwineEdgeData:
    """One edge of a node, parsed from the content of a `[[<edge text>|<target node name>]]` link."""

    # When the raw edge text contains this flag (any letter case) the edge text is exported empty
    IGNORE_EMPTY_TEXT_FLAG = "~ignore~"

    def __init__(self):
        # Content between `[[` and `]]` and the part of it before the `|`
        self.raw_data = None
        self.raw_text = None

        # Computed by parse()
        self.text = None
        self.target_node_index = None
        # Index of the node that owns this edge, only used in warnings
        self.owner_node_index = None

    def is_empty_edge_text(self):
        """Return True if there is no raw text or the raw text contains the ignore flag."""
        return self.raw_text is None or self.IGNORE_EMPTY_TEXT_FLAG in self.raw_text.lower()

    def parse(self):
        """
        Split raw_data on `|` into the edge text and the target node name.

        Fills text and target_node_index. When raw_data does not have exactly
        two parts a warning is printed and nothing is filled.
        """
        # TODO make sure there are not multiple of these
        parts = self.raw_data.split("|")
        if len(parts) != 2:
            print_yellow("Node Index = {} has an edge with len(parts) = {}. There must be exactly 2. Did you use `|` inside your edge?".format(self.owner_node_index, len(parts)))
            return

        # Text
        self.raw_text = parts[0]
        if self.is_empty_edge_text():
            self.text = ""
        else:
            self.text = TwineHelper.clean_text(self.raw_text)

        # Target node index, the speaker part of the target name is not needed
        context_parse_name = "Node Index = {} Edge, parts[1] = `{}`".format(self.owner_node_index, parts[1])
        self.target_node_index, ignored_speaker = TwineHelper.parse_twine_node_name(parts[1], context_parse_name, context_parse_name, context_parse_name)

    def to_dict(self):
        """
        Return the edge as a dictionary with the keys `TargetNodeIndex` and `Text`.

        An edge without text, without a target index or with a target index
        below ROOT_NODE_INDEX is reported with a warning and returned as {}.
        """
        if self.text is None or self.target_node_index is None or self.target_node_index < ROOT_NODE_INDEX:
            print_yellow("Node index = {}, Edge invalid = {}. ignoring.".format(self.owner_node_index, str(self)))
            return {}

        return {
            "TargetNodeIndex": self.target_node_index,
            "Text": self.text
        }

    def __str__(self):
        return "TwineEdgeData(target_node_index = {}, text = `{}`)".format(self.target_node_index, self.text)

    def __repr__(self):
        return str(self)


class TwineInnerEdgeData:
    """
    One entry of a speech sequence node.

    An entry is described by three fields, each written as
    ``<Field>:`` //<value>// where the field is Speaker, Text or EdgeText.
    """

    REGEX_SPEAKER = r"``\s*Speaker\s*:\s*``\s*//(.*)//"
    REGEX_TEXT = r"``\s*Text\s*:\s*``\s*//(.*)//"
    REGEX_EDGE_TEXT = r"``\s*EdgeText\s*:\s*``\s*//(.*)//"

    def __init__(self):
        self.raw_data = None

        # Filled by parse()
        self.speaker = None
        self.text = None
        self.edge_text = None
        # Index of the owning speech sequence node, only used in warnings
        self.owner_node_index = None

    def _match_first_group(self, pattern, warning_multiple, warning_no_group):
        """
        Return the stripped group 1 of the first match of `pattern` in raw_data.

        Returns None when nothing could be extracted. Both warnings are format
        templates that receive the owner node index.
        """
        extracted = None
        found = re.finditer(pattern, self.raw_data, re.MULTILINE | re.UNICODE | re.IGNORECASE)
        for position, current in enumerate(found):
            if position > 0:
                # Only the first match counts, any other one is just reported
                print_yellow(warning_multiple.format(self.owner_node_index))
                break

            captured = current.group(1)
            if captured is None:
                print_yellow(warning_no_group.format(self.owner_node_index))
                continue

            extracted = captured.strip()

        return extracted

    def parse(self):
        """Fill speaker, text and edge_text from raw_data; a field that is not found keeps its value."""
        # Parse speaker
        speaker = self._match_first_group(
            self.REGEX_SPEAKER,
            "Node speech sequence Index = {} got multiple matches for Speaker",
            "Node speech sequence Index = {} could not get group 1 that matches ``Speaker:`` //<Name>//"
        )
        if speaker is not None:
            self.speaker = speaker

        # Parse text
        text = self._match_first_group(
            self.REGEX_TEXT,
            "Node speech sequence Index = {} got multiple matches for Text",
            "Node speech sequence Index = {} could not get group 1 that matches ``Text:`` //<text>//"
        )
        if text is not None:
            self.text = TwineHelper.clean_text(text)

        # Parse edge text
        edge_text = self._match_first_group(
            self.REGEX_EDGE_TEXT,
            "Node speech sequence Index = {} got multiple matches for edge text",
            "Node speech sequence Index = {} could not get group 1 that matches ``EdgeText:`` //<edge_text>//"
        )
        if edge_text is not None:
            self.edge_text = edge_text

    def to_dict(self):
        """Return the entry as a dictionary, or {} when any of the fields (or raw_data) is missing."""
        required = (self.speaker, self.raw_data, self.text, self.edge_text)
        if any(value is None for value in required):
            return {}

        return {
            "Speaker": self.speaker,
            "Text": self.text,
            "EdgeText": self.edge_text
        }

    def __str__(self):
        template = "TwineInnerEdgeData(speaker = {}, text = {}, edge_text = `{}`)"
        return template.format(self.speaker, self.text, self.edge_text)

    def __repr__(self):
        return str(self)


class TwineNodeData:
    """One Twine passage: its raw name, tags and content, plus the node data computed from them."""

    # Content of a `[[<edge text>|<target node name>]]` link. Non-greedy, so
    # that several links on the same line are captured as separate edges.
    REGEX_EDGES = r"\[\[(.*?)\]\]"

    def __init__(self):
        self.raw_name = None
        self.raw_data = None
        self.raw_tags = None

        # Computed from raw data
        self.node_index = None
        self.speaker = None
        self.text = ""
        self.tags = []
        self.edges = []
        self.inner_edges = []

    def __get_raw_data_until_edges(self):
        """Return raw_data up to (not including) the first `[[`, or all of it when there is no edge."""
        index_edge_start = self.raw_data.find("[[")
        if index_edge_start == -1:
            # take whole string
            return self.raw_data

        # Until the first edge
        return self.raw_data[0:index_edge_start]

    def _parse_text(self):
        """Fill text from the content that precedes the edges, for the node types that have text."""
        # raw_data stays None when the passage has no content at all
        if not self.raw_data or not self.can_have_text():
            return

        self.text = TwineHelper.clean_text(self.__get_raw_data_until_edges())

    def _parse_edges(self):
        """Create one TwineEdgeData for each `[[...]]` link found in raw_data."""
        # Refuse to parse, because on some nodes we don't care about the edge text
        if not self.raw_data or not self.can_have_text_on_edges():
            return None

        for match in re.finditer(self.REGEX_EDGES, self.raw_data, re.MULTILINE | re.UNICODE):
            group = match.group(1)
            if group is None:
                print_yellow("Node Index = {} could not get group 1 that matches [[<edge content>|<edge index>]]".format(self.node_index))
                continue

            edge = TwineEdgeData()
            edge.raw_data = group.strip()
            edge.owner_node_index = self.node_index
            edge.parse()
            self.edges.append(edge)

    def _parse_inner_edges(self):
        """Create one TwineInnerEdgeData for each `---` separated part, only for speech sequence nodes."""
        if not self.is_node_speech_sequence() or not self.raw_data:
            return

        raw_text_data = self.__get_raw_data_until_edges().strip()
        inner_edges_parts = raw_text_data.split("---")
        if not inner_edges_parts:
            print_yellow("Node Index = {} which is a speech sequence node does not have inner edges".format(self.node_index))
            return

        for raw_inner_edge in inner_edges_parts:
            inner_edge = TwineInnerEdgeData()
            inner_edge.raw_data = raw_inner_edge.strip()
            inner_edge.owner_node_index = self.node_index
            inner_edge.parse()
            self.inner_edges.append(inner_edge)

    def parse(self):
        """Compute tags, node index, speaker, text, edges and inner edges from the raw values."""
        # A passage without the tags attribute leaves raw_tags as None, treat it as untagged
        self.tags = [x.lower() for x in (self.raw_tags or "").split()]

        # Get node index and speaker, a missing name simply does not match
        context_parse_name = "Node Name = {}".format(self.raw_name)
        self.node_index, self.speaker = TwineHelper.parse_twine_node_name(self.raw_name or "", context_parse_name, context_parse_name, context_parse_name)

        self._parse_text()
        if not TwineNodeTag.has_valid_tags(self.tags):
            print_yellow("Node Index = {} does not have any valid tags = {}".format(self.node_index, self.tags))

        self._parse_edges()
        self._parse_inner_edges()

    def can_have_text(self):
        return self.is_node_speech() or self.is_node_virtual_parent()

    def can_have_text_on_edges(self):
        return self.is_node_start() or self.is_node_speech() or self.is_node_speech_sequence()

    def is_node_start(self):
        return TwineNodeTag.NODE_START in self.tags

    def is_node_end(self):
        return TwineNodeTag.NODE_END in self.tags

    def is_node_speech(self):
        return TwineNodeTag.NODE_SPEECH in self.tags

    def is_node_virtual_parent(self):
        return TwineNodeTag.NODE_VIRTUAL_PARENT in self.tags

    def is_node_speech_sequence(self):
        return TwineNodeTag.NODE_SPEECH_SEQUENCE in self.tags

    def is_node_selector(self):
        return self.is_node_selector_first() or self.is_node_selector_random()

    def is_node_selector_first(self):
        return TwineNodeTag.NODE_SELECTOR_FIRST in self.tags

    def is_node_selector_random(self):
        return TwineNodeTag.NODE_SELECTOR_RANDOM in self.tags

    def to_dict(self):
        """
        Return the node as a dictionary.

        Speech sequence nodes get the keys NodeIndex, Speaker, Sequence and
        Edges. Speech, virtual parent and start nodes get NodeIndex, Speaker,
        Text and Edges. Any other node, and a node whose index is missing or
        below ROOT_NODE_INDEX, is returned as {}.
        """
        if self.node_index is None or self.node_index < ROOT_NODE_INDEX:
            print_yellow("Node Index = {} is invalid ignoring".format(self.node_index))
            return {}

        edges = [edge.to_dict() for edge in self.edges]
        inner_edges = [inner_edge.to_dict() for inner_edge in self.inner_edges]

        if self.is_node_speech_sequence():
            return {
                "NodeIndex": self.node_index,
                "Speaker": self.speaker,
                "Sequence": inner_edges,
                "Edges": edges
            }

        if self.can_have_text() or self.is_node_start():
            return {
                "NodeIndex": self.node_index,
                "Speaker": self.speaker,
                "Text": self.text,
                "Edges": edges
            }

        return {}

    def __str__(self):
        return "TwineNodeData(node_index = {}, speakr = {},  tags = {}, text = `{}`, edges = {})".format(self.node_index, self.speaker, self.tags, self.text, self.edges)

    def __repr__(self):
        return str(self)


class TwineDocumentData:
    """The whole dialogue of one Twine file: its name, its guid and all the nodes."""

    def __init__(self):
        # Guid exactly as it was read from the file
        self.raw_guid = None

        self.dialogue_name = None
        self.dialogue_guid = None
        self.nodes = []

    def _parse_dialogue_guid(self):
        """Store raw_guid in dialogue_guid as upper case hex digits without separators."""
        # Convert to default Unreal uuid
        self.dialogue_guid = uuid.UUID(self.raw_guid).hex.upper()

    def parse(self):
        """Compute the values derived from the raw data (currently only the guid)."""
        self._parse_dialogue_guid()

    def to_dict(self):
        """
        Return the document as a dictionary with the keys DialogueName,
        DialogueGUID, SpeechNodes and SpeechSequenceNodes.

        Returns {} when the name or the guid is missing or there are no nodes.
        Speech, virtual parent and start nodes go into SpeechNodes, speech
        sequence nodes into SpeechSequenceNodes, every other node is ignored.
        """
        missing_header = self.dialogue_name is None or self.dialogue_guid is None
        if missing_header or not self.nodes:
            return {}

        result = {
            "DialogueName": self.dialogue_name,
            "DialogueGUID": self.dialogue_guid,
            "SpeechNodes": [],
            "SpeechSequenceNodes": []
        }
        for node in self.nodes:
            if node.is_node_speech_sequence():
                result["SpeechSequenceNodes"].append(node.to_dict())
                continue

            if node.is_node_speech() or node.is_node_virtual_parent() or node.is_node_start():
                result["SpeechNodes"].append(node.to_dict())

        return result

    def __str__(self):
        nodes_text = "\n".join(str(n) for n in self.nodes)
        return "TwineDocumentData(dialogue_name = {}, dialogue_guid = {}, nodes =\n{})".format(self.dialogue_name, self.dialogue_guid, nodes_text)

    def __repr__(self):
        return str(self)


class TwineHtmlParser(HTMLParser):
    """
    HTMLParser that fills a TwineDocumentData while the html is fed to it.

    The `tw-storydata` element provides the dialogue name and guid, every
    `tw-passagedata` element becomes one TwineNodeData of the document.
    """

    HTML_TAG_STORYDATA = "tw-storydata"
    HTML_TAG_PASSAGE_DATA = "tw-passagedata"

    HTML_ATTR_NAME = "name"
    HTML_ATTR_TAGS = "tags"
    HTML_ATTR_GUID = "ifid"

    def __init__(self):
        super().__init__()
        self.document = TwineDocumentData()
        # Tag and node being processed, both are cleared at every end tag
        self.current_tag = None
        self.current_node = None

    def handle_starttag(self, tag, attrs):
        """Read the attributes of the story element, or start a new node for a passage element."""
        self.current_tag = tag

        if tag == self.HTML_TAG_STORYDATA:
            # Data about dialogue
            for attr_name, attr_value in attrs:
                if attr_name == self.HTML_ATTR_NAME:
                    self.document.dialogue_name = attr_value.strip()
                elif attr_name == self.HTML_ATTR_GUID:
                    self.document.raw_guid = attr_value.strip()
            return

        if tag != self.HTML_TAG_PASSAGE_DATA:
            return

        # Data about each node
        self.current_node = TwineNodeData()
        self.document.nodes.append(self.current_node)
        for attr_name, attr_value in attrs:
            if attr_name == self.HTML_ATTR_NAME:
                self.current_node.raw_name = attr_value.strip()
            elif attr_name == self.HTML_ATTR_TAGS:
                self.current_node.raw_tags = attr_value.strip()

    def handle_endtag(self, tag):
        """Parse the finished story or passage element, then forget the current tag and node."""
        if tag == self.HTML_TAG_STORYDATA:
            self.document.parse()
        elif tag == self.HTML_TAG_PASSAGE_DATA:
            self.current_node.parse()

        self.current_tag = None
        self.current_node = None

    def handle_data(self, data):
        """Store the stripped text of a passage element as the raw data of the current node."""
        if self.current_tag is None or self.current_node is None:
            return

        if self.current_tag == self.HTML_TAG_PASSAGE_DATA:
            self.current_node.raw_data = data.strip()

    def handle_comment(self, data):
        print("Comment  :", data)

    def handle_entityref(self, name):
        character = chr(name2codepoint[name])
        print("Named ent:", character)

    def handle_charref(self, name):
        # A leading `x` marks a hexadecimal reference, anything else is parsed as decimal
        codepoint = int(name[1:], 16) if name.startswith('x') else int(name)
        print("Num ent  :", chr(codepoint))

    def handle_decl(self, data):
        print("Decl     :", data)


def exit_program(status):
    """Terminate the program by raising SystemExit with `status` as the exit status."""
    raise SystemExit(status)


def exit_program_error(message=None):
    """Exit the program with status 1, printing `message` in red first when one is given."""
    should_report = message is not None
    if should_report:
        print_red(message)

    exit_program(1)


def exit_program_success():
    """Exit the program with status 0."""
    success_status = 0
    exit_program(success_status)


def convert_path_to_absolute_if_not_already(path):
    """Return `path` unchanged when it is already absolute, otherwise its os.path.abspath()."""
    return path if os.path.isabs(path) else os.path.abspath(path)


def is_path_twine_file(path):
    """Return True if `path` is an existing file whose extension is exactly `.html`."""
    if not os.path.isfile(path):
        return False

    # TODO Maybe parse the contents
    extension = os.path.splitext(os.path.basename(str(path)))[1]
    return extension == ".html"


def json_save_dictionary(path, dictionary):
    """
    Write `dictionary` as json, indented by 4 spaces, to the file at `path`.

    Failing to open the file (IOError) or to serialize the dictionary
    (ValueError) is reported in red instead of being raised. Always returns None.
    """
    try:
        with open(path, 'w') as output_file:
            try:
                json.dump(dictionary, output_file, indent=4)
            except ValueError as save_error:
                print_red("Can't save file = `{}`. Error = `{}`".format(path, save_error))
                return None
    except IOError as open_error:
        print_red("Can't open file = `{}`. IOError = `{}`".format(path, open_error))


def twine_parse_file(path):
    """
    Parse the Twine html file at `path`, read as utf8.

    Returns the document built by TwineHtmlParser, or None when the file
    can't be opened or read (the IOError is reported in red).
    """
    try:
        with open(path, 'r', encoding="utf8") as fh:
            html_parser = TwineHtmlParser()
            contents = fh.read()
            html_parser.feed(contents)
            return html_parser.document
    except IOError as e:
        print_red("Can't open file = `{}`. IOError = `{}`".format(path, e))

    return None


def export_twine_file_dlg_text_json(src_file_path, src_twine_dir_from, dst_json_dir):
    """
    Convert one Twine html file into a `.dlg_human.json` file under `dst_json_dir`.

    The destination mirrors the source layout: the directories that follow
    `src_twine_dir_from` in `src_file_path` are recreated under `dst_json_dir`.

    src_file_path      -- path of the Twine html file to convert
    src_twine_dir_from -- name (one path component) of the root source directory
    dst_json_dir       -- root directory of the generated json files

    Returns None. Every problem is reported as a warning and the file is skipped.
    """
    # Construct subdirectory we need to create our destination file
    src_dirname, src_filename = os.path.split(src_file_path)

    # NOTE(review): the first component equal to src_twine_dir_from is used, an
    # ancestor directory with the same name would be picked instead - confirm
    src_dirname_parts = src_dirname.split(os.sep)
    dst_dirname = None
    for index, part in enumerate(src_dirname_parts):
        if part == src_twine_dir_from:
            dst_dirname = os.sep.join(src_dirname_parts[index + 1:])
            break

    if dst_dirname is None:
        print_yellow("Can't find dst_dirname for src_file_path = `{}`".format(src_file_path))
        return

    # Ensure dirname exists in destination
    dst_dirname = os.path.join(dst_json_dir, dst_dirname)
    if not os.path.exists(dst_dirname):
        os.makedirs(dst_dirname, exist_ok=True)
        print_blue("Creating directory = `{}`".format(dst_dirname))
    # Check the directory we are about to write into, not only the destination root
    if not os.path.isdir(dst_dirname):
        print_yellow("Path = `{}` is not a directory. Ignoring".format(dst_dirname))
        return

    # Parse file
    print_blue("Parsing file = `{}`".format(src_file_path))
    twine_document = twine_parse_file(src_file_path)
    if twine_document is None:
        print_yellow("Can't parse twine file = `{}`".format(src_file_path))
        return

    json_human_content = twine_document.to_dict()
    if not json_human_content:
        print_yellow("Twine file = `{}` is corrupt or invalid. Can't parse any data".format(src_file_path))
        return

    # Write file, same base name as the source with the json extension
    src_file, src_file_ext = os.path.splitext(src_filename)
    dst_file_path = os.path.join(dst_dirname, src_file) + DLG_JSON_HUMAN_EXTENSION
    print_blue("Writing file = `{}`".format(dst_file_path))
    json_save_dictionary(dst_file_path, json_human_content)
    print("")


def main(src_twine_dir, dst_json_dir):
    """
    Export every Twine html file found under `src_twine_dir` into `dst_json_dir`.

    Exits with an error when the source is not an existing directory or the
    destination is not a directory. The destination is created when missing.
    Files that are not Twine files are reported and skipped.
    """
    if not os.path.exists(src_twine_dir):
        exit_program_error("src_twine_dir = `{}` does not exist".format(src_twine_dir))
    if not os.path.isdir(src_twine_dir):
        exit_program_error("src_twine_dir = `{}` is not a directory".format(src_twine_dir))

    if not os.path.exists(dst_json_dir):
        os.makedirs(dst_json_dir, exist_ok=True)
        print_blue("Creating dst_json_dir = `{}`".format(dst_json_dir))
    if not os.path.isdir(dst_json_dir):
        exit_program_error("dst_json_dir = `{}` is not a directory".format(dst_json_dir))

    # Walk over all files in directory
    src_twine_dir = convert_path_to_absolute_if_not_already(src_twine_dir)
    dst_json_dir = convert_path_to_absolute_if_not_already(dst_json_dir)
    print_blue("Finding save files in src_twine_dir = {}\n".format(src_twine_dir))

    # Name of the root source directory, the exported files mirror everything below it
    source_root_name = os.path.basename(os.path.normpath(src_twine_dir))
    for current_dir, _subdirs, filenames in os.walk(src_twine_dir):
        for filename in filenames:
            candidate = os.path.join(current_dir, filename)
            if not is_path_twine_file(candidate):
                print_yellow("Path = `{}` is not a file or a twine file".format(candidate))
                continue

            export_twine_file_dlg_text_json(candidate, source_root_name, dst_json_dir)


if __name__ == "__main__":
    # Both positional arguments are optional and fall back to the default directories
    parser = argparse.ArgumentParser()
    parser.add_argument(
        'src_twine_dir',
        nargs='?',
        type=str,
        help='Source directory from where we get all the .html twine files',
        default="DialoguesTwine/"
    )
    parser.add_argument(
        'dst_json_dir',
        nargs='?',
        type=str,
        help='Destination directory where we store all the .dlg_human.json files',
        default="DialoguesJsonHumanText/"
    )

    args = parser.parse_args()
    main(args.src_twine_dir, args.dst_json_dir)

DlgTwineToJsonHumanText.Colors
Definition DlgTwineToJsonHumanText.py:21

DlgTwineToJsonHumanText.TwineDocumentData
Definition DlgTwineToJsonHumanText.py:436

DlgTwineToJsonHumanText.TwineDocumentData.to_dict
to_dict(self)
Definition DlgTwineToJsonHumanText.py:452

DlgTwineToJsonHumanText.TwineDocumentData.__str__
__str__(self)
Definition DlgTwineToJsonHumanText.py:474

DlgTwineToJsonHumanText.TwineDocumentData.__init__
__init__(self)
Definition DlgTwineToJsonHumanText.py:437

DlgTwineToJsonHumanText.TwineDocumentData._parse_dialogue_guid
_parse_dialogue_guid(self)
Definition DlgTwineToJsonHumanText.py:444

DlgTwineToJsonHumanText.TwineDocumentData.dialogue_guid
dialogue_guid
Definition DlgTwineToJsonHumanText.py:441

DlgTwineToJsonHumanText.TwineDocumentData.dialogue_name
dialogue_name
Definition DlgTwineToJsonHumanText.py:440

DlgTwineToJsonHumanText.TwineDocumentData.__repr__
__repr__(self)
Definition DlgTwineToJsonHumanText.py:477

DlgTwineToJsonHumanText.TwineDocumentData.nodes
nodes
Definition DlgTwineToJsonHumanText.py:442

DlgTwineToJsonHumanText.TwineDocumentData.raw_guid
raw_guid
Definition DlgTwineToJsonHumanText.py:438

DlgTwineToJsonHumanText.TwineDocumentData.parse
parse(self)
Definition DlgTwineToJsonHumanText.py:449

DlgTwineToJsonHumanText.TwineEdgeData
Definition DlgTwineToJsonHumanText.py:162

DlgTwineToJsonHumanText.TwineEdgeData.target_node_index
target_node_index
Definition DlgTwineToJsonHumanText.py:170

DlgTwineToJsonHumanText.TwineEdgeData.parse
parse(self)
Definition DlgTwineToJsonHumanText.py:177

DlgTwineToJsonHumanText.TwineEdgeData.__init__
__init__(self)
Definition DlgTwineToJsonHumanText.py:165

DlgTwineToJsonHumanText.TwineEdgeData.__repr__
__repr__(self)
Definition DlgTwineToJsonHumanText.py:210

DlgTwineToJsonHumanText.TwineEdgeData.text
text
Definition DlgTwineToJsonHumanText.py:169

DlgTwineToJsonHumanText.TwineEdgeData.raw_text
raw_text
Definition DlgTwineToJsonHumanText.py:167

DlgTwineToJsonHumanText.TwineEdgeData.__str__
__str__(self)
Definition DlgTwineToJsonHumanText.py:207

DlgTwineToJsonHumanText.TwineEdgeData.owner_node_index
owner_node_index
Definition DlgTwineToJsonHumanText.py:171

DlgTwineToJsonHumanText.TwineEdgeData.to_dict
to_dict(self)
Definition DlgTwineToJsonHumanText.py:196

DlgTwineToJsonHumanText.TwineEdgeData.raw_data
raw_data
Definition DlgTwineToJsonHumanText.py:166

DlgTwineToJsonHumanText.TwineEdgeData.IGNORE_EMPTY_TEXT_FLAG
str IGNORE_EMPTY_TEXT_FLAG
Definition DlgTwineToJsonHumanText.py:163

DlgTwineToJsonHumanText.TwineEdgeData.is_empty_edge_text
is_empty_edge_text(self)
Definition DlgTwineToJsonHumanText.py:174

DlgTwineToJsonHumanText.TwineHelper
Definition DlgTwineToJsonHumanText.py:129

DlgTwineToJsonHumanText.TwineHelper.clean_text
clean_text(cls, text)
Definition DlgTwineToJsonHumanText.py:157

DlgTwineToJsonHumanText.TwineHelper.parse_twine_node_name
parse_twine_node_name(cls, raw_name, context_multiple_matches, context_invalid_index, context_invalid_speaker)
Definition DlgTwineToJsonHumanText.py:133

DlgTwineToJsonHumanText.TwineHelper.REGEX_NAME
str REGEX_NAME
Definition DlgTwineToJsonHumanText.py:130

DlgTwineToJsonHumanText.TwineHtmlParser
Definition DlgTwineToJsonHumanText.py:481

DlgTwineToJsonHumanText.TwineHtmlParser.document
document
Definition DlgTwineToJsonHumanText.py:491

DlgTwineToJsonHumanText.TwineHtmlParser.__init__
__init__(self)
Definition DlgTwineToJsonHumanText.py:489

DlgTwineToJsonHumanText.TwineHtmlParser.HTML_ATTR_TAGS
str HTML_ATTR_TAGS
Definition DlgTwineToJsonHumanText.py:486

DlgTwineToJsonHumanText.TwineHtmlParser.HTML_TAG_PASSAGE_DATA
str HTML_TAG_PASSAGE_DATA
Definition DlgTwineToJsonHumanText.py:483

DlgTwineToJsonHumanText.TwineHtmlParser.handle_comment
handle_comment(self, data)
Definition DlgTwineToJsonHumanText.py:538

DlgTwineToJsonHumanText.TwineHtmlParser.current_node
current_node
Definition DlgTwineToJsonHumanText.py:493

DlgTwineToJsonHumanText.TwineHtmlParser.current_tag
current_tag
Definition DlgTwineToJsonHumanText.py:492

DlgTwineToJsonHumanText.TwineHtmlParser.HTML_ATTR_NAME
str HTML_ATTR_NAME
Definition DlgTwineToJsonHumanText.py:485

DlgTwineToJsonHumanText.TwineHtmlParser.handle_starttag
handle_starttag(self, tag, attrs)
Definition DlgTwineToJsonHumanText.py:495

DlgTwineToJsonHumanText.TwineHtmlParser.handle_data
handle_data(self, data)
Definition DlgTwineToJsonHumanText.py:529

DlgTwineToJsonHumanText.TwineHtmlParser.handle_endtag
handle_endtag(self, tag)
Definition DlgTwineToJsonHumanText.py:519

DlgTwineToJsonHumanText.TwineHtmlParser.handle_entityref
handle_entityref(self, name)
Definition DlgTwineToJsonHumanText.py:541

DlgTwineToJsonHumanText.TwineHtmlParser.handle_charref
handle_charref(self, name)
Definition DlgTwineToJsonHumanText.py:545

DlgTwineToJsonHumanText.TwineHtmlParser.handle_decl
handle_decl(self, data)
Definition DlgTwineToJsonHumanText.py:552

DlgTwineToJsonHumanText.TwineHtmlParser.HTML_TAG_STORYDATA
str HTML_TAG_STORYDATA
Definition DlgTwineToJsonHumanText.py:482

DlgTwineToJsonHumanText.TwineHtmlParser.HTML_ATTR_GUID
str HTML_ATTR_GUID
Definition DlgTwineToJsonHumanText.py:487

DlgTwineToJsonHumanText.TwineInnerEdgeData
Definition DlgTwineToJsonHumanText.py:214

DlgTwineToJsonHumanText.TwineInnerEdgeData.__str__
__str__(self)
Definition DlgTwineToJsonHumanText.py:280

DlgTwineToJsonHumanText.TwineInnerEdgeData.speaker
speaker
Definition DlgTwineToJsonHumanText.py:222

DlgTwineToJsonHumanText.TwineInnerEdgeData.REGEX_EDGE_TEXT
str REGEX_EDGE_TEXT
Definition DlgTwineToJsonHumanText.py:217

DlgTwineToJsonHumanText.TwineInnerEdgeData.text
text
Definition DlgTwineToJsonHumanText.py:223

DlgTwineToJsonHumanText.TwineInnerEdgeData.to_dict
to_dict(self)
Definition DlgTwineToJsonHumanText.py:269

DlgTwineToJsonHumanText.TwineInnerEdgeData.edge_text
edge_text
Definition DlgTwineToJsonHumanText.py:224

DlgTwineToJsonHumanText.TwineInnerEdgeData.__repr__
__repr__(self)
Definition DlgTwineToJsonHumanText.py:283

DlgTwineToJsonHumanText.TwineInnerEdgeData.owner_node_index
owner_node_index
Definition DlgTwineToJsonHumanText.py:225

DlgTwineToJsonHumanText.TwineInnerEdgeData.parse
parse(self)
Definition DlgTwineToJsonHumanText.py:227

DlgTwineToJsonHumanText.TwineInnerEdgeData.REGEX_TEXT
str REGEX_TEXT
Definition DlgTwineToJsonHumanText.py:216

DlgTwineToJsonHumanText.TwineInnerEdgeData.REGEX_SPEAKER
str REGEX_SPEAKER
Definition DlgTwineToJsonHumanText.py:215

DlgTwineToJsonHumanText.TwineInnerEdgeData.__init__
__init__(self)
Definition DlgTwineToJsonHumanText.py:219

DlgTwineToJsonHumanText.TwineInnerEdgeData.raw_data
raw_data
Definition DlgTwineToJsonHumanText.py:220

DlgTwineToJsonHumanText.TwineNodeData
Definition DlgTwineToJsonHumanText.py:287

DlgTwineToJsonHumanText.TwineNodeData.raw_name
raw_name
Definition DlgTwineToJsonHumanText.py:291

DlgTwineToJsonHumanText.TwineNodeData.is_node_speech
is_node_speech(self)
Definition DlgTwineToJsonHumanText.py:380

DlgTwineToJsonHumanText.TwineNodeData.raw_data
raw_data
Definition DlgTwineToJsonHumanText.py:292

DlgTwineToJsonHumanText.TwineNodeData.is_node_selector_random
is_node_selector_random(self)
Definition DlgTwineToJsonHumanText.py:395

DlgTwineToJsonHumanText.TwineNodeData.parse
parse(self)
Definition DlgTwineToJsonHumanText.py:354

DlgTwineToJsonHumanText.TwineNodeData.can_have_text
can_have_text(self)
Definition DlgTwineToJsonHumanText.py:368

DlgTwineToJsonHumanText.TwineNodeData.tags
tags
Definition DlgTwineToJsonHumanText.py:299

DlgTwineToJsonHumanText.TwineNodeData.is_node_virtual_parent
is_node_virtual_parent(self)
Definition DlgTwineToJsonHumanText.py:383

DlgTwineToJsonHumanText.TwineNodeData.to_dict
to_dict(self)
Definition DlgTwineToJsonHumanText.py:398

DlgTwineToJsonHumanText.TwineNodeData._parse_text
_parse_text(self)
Definition DlgTwineToJsonHumanText.py:312

DlgTwineToJsonHumanText.TwineNodeData.is_node_selector
is_node_selector(self)
Definition DlgTwineToJsonHumanText.py:389

DlgTwineToJsonHumanText.TwineNodeData.is_node_speech_sequence
is_node_speech_sequence(self)
Definition DlgTwineToJsonHumanText.py:386

DlgTwineToJsonHumanText.TwineNodeData.__get_raw_data_until_edges
__get_raw_data_until_edges(self)
Definition DlgTwineToJsonHumanText.py:303

DlgTwineToJsonHumanText.TwineNodeData.node_index
node_index
Definition DlgTwineToJsonHumanText.py:296

DlgTwineToJsonHumanText.TwineNodeData.can_have_text_on_edges
can_have_text_on_edges(self)
Definition DlgTwineToJsonHumanText.py:371

DlgTwineToJsonHumanText.TwineNodeData.edges
edges
Definition DlgTwineToJsonHumanText.py:300

DlgTwineToJsonHumanText.TwineNodeData.__str__
__str__(self)
Definition DlgTwineToJsonHumanText.py:429

DlgTwineToJsonHumanText.TwineNodeData.is_node_start
is_node_start(self)
Definition DlgTwineToJsonHumanText.py:374

DlgTwineToJsonHumanText.TwineNodeData._parse_edges
_parse_edges(self)
Definition DlgTwineToJsonHumanText.py:318

DlgTwineToJsonHumanText.TwineNodeData.is_node_end
is_node_end(self)
Definition DlgTwineToJsonHumanText.py:377

DlgTwineToJsonHumanText.TwineNodeData.__repr__
__repr__(self)
Definition DlgTwineToJsonHumanText.py:432

DlgTwineToJsonHumanText.TwineNodeData.is_node_selector_first
is_node_selector_first(self)
Definition DlgTwineToJsonHumanText.py:392

DlgTwineToJsonHumanText.TwineNodeData._parse_inner_edges
_parse_inner_edges(self)
Definition DlgTwineToJsonHumanText.py:337

DlgTwineToJsonHumanText.TwineNodeData.raw_tags
raw_tags
Definition DlgTwineToJsonHumanText.py:293

DlgTwineToJsonHumanText.TwineNodeData.text
text
Definition DlgTwineToJsonHumanText.py:298

DlgTwineToJsonHumanText.TwineNodeData.inner_edges
inner_edges
Definition DlgTwineToJsonHumanText.py:301

DlgTwineToJsonHumanText.TwineNodeData.speaker
speaker
Definition DlgTwineToJsonHumanText.py:297

DlgTwineToJsonHumanText.TwineNodeData.REGEX_EDGES
str REGEX_EDGES
Definition DlgTwineToJsonHumanText.py:288

DlgTwineToJsonHumanText.TwineNodeData.__init__
__init__(self)
Definition DlgTwineToJsonHumanText.py:290

DlgTwineToJsonHumanText.TwineNodeTag
Definition DlgTwineToJsonHumanText.py:105

DlgTwineToJsonHumanText.TwineNodeTag.NODE_SELECTOR_RANDOM
str NODE_SELECTOR_RANDOM
Definition DlgTwineToJsonHumanText.py:112

DlgTwineToJsonHumanText.TwineNodeTag.NODE_END
str NODE_END
Definition DlgTwineToJsonHumanText.py:107

DlgTwineToJsonHumanText.TwineNodeTag.NODE_VIRTUAL_PARENT
str NODE_VIRTUAL_PARENT
Definition DlgTwineToJsonHumanText.py:108

DlgTwineToJsonHumanText.TwineNodeTag.has_valid_tags
has_valid_tags(cls, tags_list)
Definition DlgTwineToJsonHumanText.py:123

DlgTwineToJsonHumanText.TwineNodeTag.NODE_SPEECH_SEQUENCE
NODE_SPEECH_SEQUENCE
Definition DlgTwineToJsonHumanText.py:116

DlgTwineToJsonHumanText.TwineNodeTag.NODE_VIRTUAL_PARENT
NODE_VIRTUAL_PARENT
Definition DlgTwineToJsonHumanText.py:116

DlgTwineToJsonHumanText.TwineNodeTag.NODE_SELECTOR_FIRST
str NODE_SELECTOR_FIRST
Definition DlgTwineToJsonHumanText.py:111

DlgTwineToJsonHumanText.TwineNodeTag.NODE_SELECTOR_FIRST
NODE_SELECTOR_FIRST
Definition DlgTwineToJsonHumanText.py:116

DlgTwineToJsonHumanText.TwineNodeTag.NODE_SPEECH
NODE_SPEECH
Definition DlgTwineToJsonHumanText.py:116

DlgTwineToJsonHumanText.TwineNodeTag.NODE_SPEECH_SEQUENCE
str NODE_SPEECH_SEQUENCE
Definition DlgTwineToJsonHumanText.py:110

DlgTwineToJsonHumanText.TwineNodeTag.NODE_START
str NODE_START
Definition DlgTwineToJsonHumanText.py:106

DlgTwineToJsonHumanText.TwineNodeTag.get_all_tags
get_all_tags(cls)
Definition DlgTwineToJsonHumanText.py:115

DlgTwineToJsonHumanText.TwineNodeTag.is_valid_tag
is_valid_tag(cls, tag)
Definition DlgTwineToJsonHumanText.py:119

DlgTwineToJsonHumanText.TwineNodeTag.NODE_SPEECH
str NODE_SPEECH
Definition DlgTwineToJsonHumanText.py:109

DlgTwineToJsonHumanText.TwineNodeTag.NODE_START
NODE_START
Definition DlgTwineToJsonHumanText.py:116

DlgTwineToJsonHumanText.TwineNodeTag.NODE_END
NODE_END
Definition DlgTwineToJsonHumanText.py:116

bool

DlgTwineToJsonHumanText.print_red_light
print_red_light(*args, **kwargs)
Definition DlgTwineToJsonHumanText.py:65

DlgTwineToJsonHumanText.convert_path_to_absolute_if_not_already
convert_path_to_absolute_if_not_already(path)
Definition DlgTwineToJsonHumanText.py:570

DlgTwineToJsonHumanText.exit_program_error
exit_program_error(message=None)
Definition DlgTwineToJsonHumanText.py:560

DlgTwineToJsonHumanText.print_blue_light
print_blue_light(*args, **kwargs)
Definition DlgTwineToJsonHumanText.py:73

DlgTwineToJsonHumanText.print_green_light
print_green_light(*args, **kwargs)
Definition DlgTwineToJsonHumanText.py:89

DlgTwineToJsonHumanText.print_blue
print_blue(*args, **kwargs)
Definition DlgTwineToJsonHumanText.py:69

DlgTwineToJsonHumanText.twine_parse_file
twine_parse_file(path)
Definition DlgTwineToJsonHumanText.py:604

DlgTwineToJsonHumanText.exit_program_success
exit_program_success()
Definition DlgTwineToJsonHumanText.py:566

DlgTwineToJsonHumanText.print_yellow
print_yellow(*args, **kwargs)
Definition DlgTwineToJsonHumanText.py:77

DlgTwineToJsonHumanText.main
main(src_twine_dir, dst_json_dir)
Definition DlgTwineToJsonHumanText.py:666

DlgTwineToJsonHumanText.print_green
print_green(*args, **kwargs)
Definition DlgTwineToJsonHumanText.py:85

DlgTwineToJsonHumanText.export_twine_file_dlg_text_json
export_twine_file_dlg_text_json(src_file_path, src_twine_dir_from, dst_json_dir)
Definition DlgTwineToJsonHumanText.py:618

DlgTwineToJsonHumanText.print_red
print_red(*args, **kwargs)
Definition DlgTwineToJsonHumanText.py:61

DlgTwineToJsonHumanText.exit_program
exit_program(status)
Definition DlgTwineToJsonHumanText.py:556

DlgTwineToJsonHumanText.print_reset_color
print_reset_color()
Definition DlgTwineToJsonHumanText.py:45

DlgTwineToJsonHumanText.print_config_value
print_config_value(config_name, config_value)
Definition DlgTwineToJsonHumanText.py:93

DlgTwineToJsonHumanText.print_yellow_light
print_yellow_light(*args, **kwargs)
Definition DlgTwineToJsonHumanText.py:81

DlgTwineToJsonHumanText.json_save_dictionary
json_save_dictionary(path, dictionary)
Definition DlgTwineToJsonHumanText.py:592

DlgTwineToJsonHumanText._print_internal
_print_internal(color, string, **kwargs)
Definition DlgTwineToJsonHumanText.py:50

DlgTwineToJsonHumanText.is_path_twine_file
is_path_twine_file(path)
Definition DlgTwineToJsonHumanText.py:577

DlgTwineToJsonHumanText.string_to_int
string_to_int(string)
Definition DlgTwineToJsonHumanText.py:98

DlgTwineToJsonHumanText.print_newlines
print_newlines(nr=1)
Definition DlgTwineToJsonHumanText.py:40