Skip to content
Snippets Groups Projects
config_global_1.1.json 1.34 KiB
{
    "usecase_description": "Config file for usecase_1: from a raw text, get the same text with EDU brackets added.",
    "data_raw": {
        "name": "edgar_poe_en",
        "exte": ".txt",
        "language": "en",
        "existing_metadata": true
    },
    "steps":{
        "main": "annotation",
        "pre-processing": {
            "to_do": true,
            "syntactic_tool": "stanza",
            "sentence_split": true,
            "tokenization": true,
            "syntactic_parsing": false,
            "create_metadata": {
                "to_do": true,
                "line": "paragraph",
                "sent": "sent"
            }
        },
        "discourse_segmenter": {
            "model": "/home/lriviere/andiamo/discut/Results_conllu/results_eng.rst.gum-eng_bert/model.tar.gz",
            "training": {
                "toolkit": null,
                "pre_trained_lm": null,
                "config_file": null,
                "train_data_path": null,
                "validation_data_path": null
            }
        },
        "evaluation": true,
        "gold_test_data_path": null
    },
    "output":{
        "conll_file":{
            "to_do": true,
            "metadata": true,
            "with_gold_labels": false
        },
        "txt_file":{
            "to_do": false,
            "metadata": true
        }
    }
}