Skip to content

Latest commit

 

History

History
180 lines (159 loc) · 4.22 KB

README.md

File metadata and controls

180 lines (159 loc) · 4.22 KB

The Catalogue of Endangered Languages as CLDF dataset

How to cite

If you use these data, please cite

Description

This dataset is licensed under CC-BY-4.0.

Available online at https://endangeredlanguages.com

Parameters

This dataset contains three sets of parameters.

  • The four categories from which the Language Endangerment Index is derived.
  • The computed Language Endangerment Index.
  • Parameters with composite JSON values, aggregating information from a specific source on a particular topic. Below is a list of JSON schemas describing the values of these parameters.

context

{
    "type": "object",
    "properties": {
        "Domains Other Langs": {
            "type": "array",
            "items": {
                "type": "string"
            }
        },
        "Government Support": {
            "type": "string"
        },
        "Institutional Support": {
            "type": "string"
        },
        "Number Speaker Other Languages": {
            "type": "string"
        },
        "Other Languages Used": {
            "type": "string"
        },
        "Speaker Attitude": {
            "type": "string"
        }
    }
}

location

{
    "type": "object",
    "properties": {
        "Coordinates": {
            "type": "array",
            "items": {
                "type": "array",
                "prefixItems": [
                    {
                        "title": "latitude",
                        "type": "number",
                        "minimum": -90,
                        "maximum": 90
                    },
                    {
                        "title": "longitude",
                        "type": "number",
                        "minimum": -180,
                        "maximum": 180
                    }
                ]
            }
        },
        "Description": {
            "type": "string"
        },
        "Places": {
            "type": "array",
            "items": {
                "type": "string"
            }
        }
    }
}

speakers

{
    "type": "object",
    "properties": {
        "Speaker Number Text": {
            "type": "string"
        },
        "Speaker Number": {
            "type": "string"
        },
        "Elders": {
            "type": "string"
        },
        "Ethnic Population": {
            "type": "string"
        },
        "Older Adults": {
            "type": "string"
        },
        "Second Language Speakers": {
            "type": "string"
        },
        "Semi Speakers": {
            "type": "string"
        },
        "Young Adults": {
            "type": "string"
        },
        "Date Of Info": {
            "type": "string"
        }
    }
}

vitality

{
    "type": "object",
    "properties": {
        "Endangerment": {
            "type": "object",
            "properties": {
                "Level": {
                    "enum": [
                        "safe",
                        "at risk",
                        "vulnerable",
                        "threatened",
                        "endangered",
                        "severely endangered",
                        "critically endangered",
                        "awakening",
                        "dormant"
                    ]
                },
                "Certainty": {
                    "type": "number",
                    "minimum": 0,
                    "maximum": 1
                }
            }
        },
        "Domains Of Use": {
            "type": "string"
        },
        "Speaker Number Trends": {
            "type": "string"
        },
        "Transmission": {
            "type": "string"
        }
    }
}

CLDF Datasets

The following CLDF datasets are available in the `cldf` directory: